Mercurial > repos > rnateam > sortmerna
comparison sortmerna.xml @ 5:233da82dc31c draft
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/rna_tools/sortmerna commit 4febb4056eb7b379edc0f3e7719a50e575a749c8
author | rnateam |
---|---|
date | Wed, 09 Dec 2015 09:21:28 -0500 |
parents | e6727cef3083 |
children | 97f73e0566c9 |
comparison
equal
deleted
inserted
replaced
4:e6727cef3083 | 5:233da82dc31c |
---|---|
1 <tool id="bg_sortmerna" name="Filter with SortMeRNA" version="2.0.0"> | 1 <tool id="bg_sortmerna" name="Filter with SortMeRNA" version="2.1.0"> |
2 <description>Fast and accurate filtering of ribosomal RNAs in metatranscriptomic data</description> | 2 <description>Fast and accurate filtering of ribosomal RNAs in metatranscriptomic data</description> |
3 <requirements> | 3 <requirements> |
4 <requirement type='package' version="2.0">sortmerna</requirement> | 4 <requirement type='package' version="2.0">sortmerna</requirement> |
5 </requirements> | 5 </requirements> |
6 <stdio> | 6 <stdio> |
20 </version_command> | 20 </version_command> |
21 <command> | 21 <command> |
22 <![CDATA[ | 22 <![CDATA[ |
23 #set $ref = '' | 23 #set $ref = '' |
24 #set $sep='' | 24 #set $sep='' |
25 #if str( $databases_type.databases_selector ) == 'history': | 25 #if str( $databases_type.databases_selector ) == 'history' |
26 #for $db in $databases_type.database_name | 26 #for $db in $databases_type.database_name |
27 #set $ref += $sep + str($db) + ',' + $os.path.splitext($os.path.basename(str($db)))[0] | 27 #set $ref += $sep + str($db) + ',' + $os.path.splitext($os.path.basename(str($db)))[0] |
28 #set $sep = ':' | 28 #set $sep = ':' |
29 #end for | 29 #end for |
30 indexdb_rna --ref $ref | 30 #else if str( $databases_type.databases_selector ) == 'cached_to_index' |
31 && | 31 ## databases path is not directly accessible, must match by hand with LOC file contents |
32 #set $data_table = dict([(_[0], _[2]) for _ in $databases_type.input_databases.input.options.tool_data_table.data]) | |
33 #for $db in $databases_type.input_databases.value | |
34 #set $ref += $sep + $data_table[$db] + ',' + $os.path.splitext($data_table[$db])[0] + '-reindexed' | |
35 #set $sep = ':' | |
36 #end for | |
32 #else: | 37 #else: |
33 ## databases path is not directly accessible, must match by hand with LOC file contents | 38 ## databases path is not directly accessible, must match by hand with LOC file contents |
34 #set $data_table = dict([(_[0], _[2]) for _ in $databases_type.input_databases.input.options.tool_data_table.data]) | 39 #set $data_table = dict([(_[0], _[2]) for _ in $databases_type.input_databases.input.options.tool_data_table.data]) |
35 #for $db in $databases_type.input_databases.value | 40 #for $db in $databases_type.input_databases.value |
36 #set $ref += $sep + $data_table[$db] + ',' + $os.path.splitext($data_table[$db])[0] | 41 #set $ref += $sep + $data_table[$db] + ',' + $os.path.splitext($data_table[$db])[0] |
37 #set $sep = ':' | 42 #set $sep = ':' |
38 #end for | 43 #end for |
39 #end if | 44 #end if |
40 sortmerna --ref $ref --reads $input_reads --aligned aligned | 45 |
41 #if str( $sequencing_type.sequencing_type_selector ) == 'paired' | 46 #if str( $databases_type.databases_selector ) != 'cached': |
42 $sequencing_type.paired_type | 47 indexdb_rna |
48 --ref $ref | |
49 -L $databases_type.seed_length | |
50 --max_pos $databases_type.max_pos | |
51 && | |
43 #end if | 52 #end if |
44 $strand_search | 53 |
45 $aligned_fastx.aligned_fastx_selector | 54 sortmerna |
46 #if $aligned_fastx.aligned_fastx_selector == '--fastx' | 55 --ref $ref |
47 #if $aligned_fastx.other | 56 --reads $input_reads |
48 --other other_file | 57 --aligned aligned |
58 | |
59 #if str( $sequencing_type.sequencing_type_selector ) == 'paired' | |
60 $sequencing_type.paired_type | |
61 #end if | |
62 | |
63 $strand_search | |
64 $aligned_fastx.aligned_fastx_selector | |
65 #if $aligned_fastx.aligned_fastx_selector == '--fastx' | |
66 #if $aligned_fastx.other | |
67 --other other_file | |
68 #end if | |
69 #end if | |
70 $aligned_sam.aligned_sam_selector | |
71 #if $aligned_sam.aligned_sam_selector == '--sam' | |
72 $aligned_sam.sq | |
73 #end if | |
74 $aligned_blast | |
75 | |
76 $log | |
77 | |
78 #if $report.report_type == 'best' | |
79 #if $report.report_best.report_best_type == '0' | |
80 --best 0 | |
81 #else if $report.report_best.report_best_type == '1' | |
82 --best 1 | |
83 --min_lis $report.report_best.report_best_min_lis | |
84 #else | |
85 --best $report.report_best.report_best_value | |
86 --min_lis $report.report_best.report_best_min_lis | |
87 #end if | |
88 #else | |
89 #if $report.report_num_alignments.report_num_alignments_type == 'other_value' | |
90 --num_alignments $report.report_num_alignments.report_num_alignments_value | |
91 #else | |
92 --num_alignments $report.report_num_alignments.report_num_alignments_type | |
93 #end if | |
49 #end if | 94 #end if |
50 #end if | 95 |
51 $aligned_sam.aligned_sam_selector | 96 -e $e_value |
52 #if $aligned_sam.aligned_sam_selector == '--sam' | 97 --match $match |
53 $aligned_sam.sq | 98 --mismatch $mismatch |
54 #end if | 99 --gap_open $gap_open |
55 $aligned_blast | 100 --gap_ext $gap_ext |
56 $log | 101 -N $ambiguous_letter |
57 -a \${GALAXY_SLOTS:-1} | 102 -a \${GALAXY_SLOTS:-1} |
58 ]]> | 103 ]]> |
59 </command> | 104 </command> |
60 <inputs> | 105 <inputs> |
61 <param format="fasta,fastq" name="input_reads" type="data" label="Querying sequences" help="In FASTA or FASTQ format (--reads)"/> | 106 <param format="fasta,fastq" name="input_reads" type="data" label="Querying sequences" help="In FASTA or FASTQ format (--reads)"/> |
62 <conditional name="sequencing_type"> | 107 <conditional name="sequencing_type"> |
63 <param name="sequencing_type_selector" type="select" label="Sequencing type"> | 108 <param name="sequencing_type_selector" type="select" label="Sequencing type"> |
64 <option value="not_paired">Reads are not paired</option> | 109 <option value="not_paired">Reads are not paired</option> |
65 <option value="paired">Reads are paired</option> | 110 <option value="paired">Reads are paired</option> |
66 </param> | 111 </param> |
112 <when value="not_paired" /> | |
67 <when value="paired"> | 113 <when value="paired"> |
68 <param name="paired_type" type="select" display="radio" label="If one of the paired-end reads aligns and the other one does not"> | 114 <param name="paired_type" type="select" display="radio" label="If one of the paired-end reads aligns and the other one does not"> |
69 <option value="">leave the reads split between aligned and rejected files</option> | 115 <option value="">leave the reads split between aligned and rejected files</option> |
70 <option value="--paired-in">output both reads to aligned file (--paired-in)</option> | 116 <option value="--paired-in">output both reads to aligned file (--paired-in)</option> |
71 <option value="--paired-out">output both reads to rejected file (--paired-out)</option> | 117 <option value="--paired-out">output both reads to rejected file (--paired-out)</option> |
72 </param> | 118 </param> |
73 </when> | 119 </when> |
74 </conditional> | 120 </conditional> |
75 | 121 |
76 <param name="strand_search" type="select" label="Which strands to search" display="radio"> | 122 <param name="strand_search" type="select" label="Which strands to search"> |
77 <option value="">Search both strands</option> | 123 <option value="">Search both strands</option> |
78 <option value="-F">Search only the forward strand (-F)</option> | 124 <option value="-F">Search only the forward strand (-F)</option> |
79 <option value="-R">Search only the reverse-complementary strand (-R)</option> | 125 <option value="-R">Search only the reverse-complementary strand (-R)</option> |
80 </param> | 126 </param> |
81 | 127 |
82 <conditional name="databases_type"> | 128 <conditional name="databases_type"> |
83 <param name="databases_selector" type="select" label="Databases to query" | 129 <param name="databases_selector" type="select" label="Databases to query" |
84 help="Public rRNA databases provided with SortMeRNA have been indexed. | 130 help="Public rRNA databases provided with SortMeRNA have been indexed. |
85 On the contrary, personal databases must be indexed each time SortMeRNA is launched. | 131 On the contrary, personal databases must be indexed each time SortMeRNA is launched. |
86 Please be patient, this may take some time depending on the size of the given database."> | 132 Please be patient, this may take some time depending on the size of the given database."> |
87 <option value="cached" selected="true">Public ribosomal databases</option> | 133 <option value="cached" selected="true">Public pre-indexed ribosomal databases</option> |
134 <option value="cached_to_index">Public ribosomal databases to index with non-default parameters</option> | |
88 <option value="history">Databases from your history</option> | 135 <option value="history">Databases from your history</option> |
89 </param> | 136 </param> |
90 <when value="cached"> | 137 <when value="cached"> |
91 <param name="input_databases" label="rRNA databases" type="select" display="checkboxes" multiple="true"> | 138 <param name="input_databases" label="rRNA databases" type="select" display="checkboxes" multiple="true"> |
92 <options from_data_table="rRNA_databases" /> | 139 <options from_data_table="rRNA_databases" /> |
93 <validator type="no_options" message="Select at least one database"/> | 140 <validator type="no_options" message="Select at least one database"/> |
94 </param> | 141 </param> |
95 </when> | 142 </when> |
143 <when value="cached_to_index"> | |
144 <param name="input_databases" label="rRNA databases" type="select" display="checkboxes" multiple="true"> | |
145 <options from_data_table="rRNA_databases" /> | |
146 <validator type="no_options" message="Select at least one database"/> | |
147 </param> | |
148 <param name="seed_length" type="integer" min="0" max="100" value="18" label="Seed length for database indexing" help="(-L)"/> | |
149 <param name="max_pos" type="integer" min="0" max="100000" value="10000" label="Maximum number of positions to store for each k-mer for database indexing" help="With 0, all positions are stored (--max_pos)"/> | |
150 </when> | |
96 <when value="history"> | 151 <when value="history"> |
97 <param name="database_name" type="data" format="fasta" multiple="true" label="rRNA databases" | 152 <param name="database_name" type="data" format="fasta" multiple="true" label="rRNA databases" |
98 help="Your databases will be indexed first, which may take up to several minutes."/> | 153 help="Your databases will be indexed first, which may take up to several minutes."/> |
154 <param name="seed_length" type="integer" min="0" max="100" value="18" label="Seed length for database indexing" help="(-L)"/> | |
155 <param name="max_pos" type="integer" min="0" max="100000" value="10000" label="Maximum number of positions to store for each k-mer for database indexing" help="With 0, all positions are stored (--max_pos)"/> | |
99 </when> | 156 </when> |
100 </conditional> | 157 </conditional> |
101 | 158 |
102 <!-- Outputs --> | 159 <!-- Outputs --> |
103 <conditional name="aligned_fastx"> | 160 <conditional name="aligned_fastx"> |
104 <param name="aligned_fastx_selector" type="select" label="Include aligned reads in FASTA/FASTQ format"> | 161 <param name="aligned_fastx_selector" type="select" label="Include aligned reads in FASTA/FASTQ format?"> |
105 <option value="--fastx">Yes (--fastx)</option> | 162 <option value="--fastx">Yes (--fastx)</option> |
106 <option value="">No</option> | 163 <option value="">No</option> |
107 </param> | 164 </param> |
108 <when value="--fastx"> | 165 <when value="--fastx"> |
109 <param name="other" type="boolean" label="Include rejected reads file" help="(--other)" /> | 166 <param name="other" type="boolean" label="Include rejected reads file?" help="(--other)" /> |
110 </when> | 167 </when> |
111 <when value="" /> | 168 <when value="" /> |
112 </conditional> | 169 </conditional> |
113 <conditional name="aligned_sam"> | 170 <conditional name="aligned_sam"> |
114 <param name="aligned_sam_selector" type="select" label="Include alignments in SAM format"> | 171 <param name="aligned_sam_selector" type="select" label="Include alignments in SAM format?"> |
115 <option value="--sam">Yes (--sam)</option> | 172 <option value="--sam">Yes (--sam)</option> |
116 <option value="">No</option> | 173 <option value="">No</option> |
117 </param> | 174 </param> |
118 <when value="--sam"> | 175 <when value="--sam"> |
119 <param name="sq" type="boolean" truevalue="--SQ" falsevalue="" label="Add SQ tags to the SAM file" help="(--SQ)" /> | 176 <param name="sq" type="boolean" truevalue="--SQ" falsevalue="" label="Add SQ tags to the SAM file" help="(--SQ)" /> |
128 <option value="" selected="true">No</option> | 185 <option value="" selected="true">No</option> |
129 </param> | 186 </param> |
130 <param name="log" type="boolean" checked="False" truevalue="--log" falsevalue="" label="Generate statistics file" | 187 <param name="log" type="boolean" checked="False" truevalue="--log" falsevalue="" label="Generate statistics file" |
131 help="Generates statistics for the rRNA content of reads, as well as rRNA subunit distribution. (--log)"> | 188 help="Generates statistics for the rRNA content of reads, as well as rRNA subunit distribution. (--log)"> |
132 </param> | 189 </param> |
190 <conditional name="report"> | |
191 <param name="report_type" type="select" label="Parameters for filtering and read mapping" help=""> | |
192 <option value="best" selected="true">Report best alignments per read reaching E-value</option> | |
193 <option value="num_alignments">Report first alignments per read reaching E-value</option> | |
194 </param> | |
195 <when value="best"> | |
196 <conditional name="report_best"> | |
197 <param name="report_best_type" type="select" label="Number of searched alignments" help="Only the best alignment is reported (--best)"> | |
198 <option value="0">All high-candidate reference sequences are searched for alignments (very slow)</option> | |
199 <option value="1" selected="true">Only one high-candidate reference sequence is searched for alignments (fast). The high-candidate sequences are determined heuristically using a LIS of seed matches</option> | |
200 <option value="other_value">A custom number of reference sequences are searched for alignments (speed decrease for high value)</option> | |
201 </param> | |
202 <when value="0" /> | |
203 <when value="1"> | |
204 <param name="report_best_min_lis" type="integer" min="0" max="100" value="2" label="Number of longest LIS an alignment needs to be searched" help="The alignments having the first INT longest LIS. LIS stands for Longest Increasing Subsequence; it is computed using seeds' positions to expand hits into longer matches prior to Smith-Waterman alignment. (--min_lis)"/> | |
205 </when> | |
206 <when value="other_value"> | |
207 <param name="report_best_value" type="integer" min="2" max="100" value="2" label="Number of alignments to be made" help="Only the best one is reported. The computation speed decreases with higher values"/> | |
208 <param name="report_best_min_lis" type="integer" min="0" max="100" value="2" label="Number of longest LIS an alignment needs to be searched" help="The alignments having the first INT longest LIS. LIS stands for Longest Increasing Subsequence; it is computed using seeds' positions to expand hits into longer matches prior to Smith-Waterman alignment. (--min_lis)"/> | |
209 </when> | |
210 </conditional> | |
211 </when> | |
212 <when value="num_alignments"> | |
213 <conditional name="report_num_alignments"> | |
214 <param name="report_num_alignments_type" type="select" label="Number of output alignments" help="(--num_alignments)"> | |
215 <option value="0">All alignments reaching the E-value threshold are reported (very slow, this option is not suggested for high similarity rRNA databases)</option> | |
216 <option value="1" selected="true">The first alignment passing the E-value threshold is reported (very fast, best choice if only filtering is needed)</option> | |
217 <option value="other_value">A custom number of alignments are made and reported (speed decrease for high value)</option> | |
218 </param> | |
219 <when value="0" /> | |
220 <when value="1" /> | |
221 <when value="other_value"> | |
222 <param name="report_num_alignments_value" type="integer" min="0" max="100" value="1" label="Number of alignments to be made and reported" help=""/> | |
223 </when> | |
224 </conditional> | |
225 </when> | |
226 </conditional> | |
227 | |
228 <param name="e_value" type="float" min="0" max="10" value="1" label="E-value threshold" help="(-e)"/> | |
229 <param name="match" type="integer" min="0" max="10" value="2" label="SW score for a match" help="(--match)"/> | |
230 <param name="mismatch" type="integer" min="-10" max="0" value="-3" label="SW penalty for a mismatch" help="(--mismatch)"/> | |
231 <param name="gap_open" type="integer" min="0" max="10" value="5" label="SW penalty for introducing a gap" help="(--gap_open)"/> | |
232 <param name="gap_ext" type="integer" min="0" max="10" value="2" label="SW penalty for extending a gap" help="(--gap_ext)"/> | |
233 <param name="ambiguous_letter" type="integer" min="-10" max="0" value="-3" label="SW penalty for ambiguous letters (N's)" help="(-N)"/> | |
133 </inputs> | 234 </inputs> |
134 <outputs> | 235 <outputs> |
135 <data format_source="input_reads" name="output_fastx" from_work_dir="aligned.dat" | 236 <data format_source="input_reads" name="output_fastx" from_work_dir="aligned.dat" |
136 label="Aligned reads on ${on_string} (${input_reads.datatype.file_ext})"> | 237 label="Aligned reads on ${on_string} (${input_reads.datatype.file_ext})"> |
137 <filter>aligned_fastx['aligned_fastx_selector']</filter> | 238 <filter>aligned_fastx['aligned_fastx_selector']</filter> |
243 | 344 |
244 The user may also choose to use their own rRNA databases. | 345 The user may also choose to use their own rRNA databases. |
245 | 346 |
246 .. class:: warningmark | 347 .. class:: warningmark |
247 | 348 |
248 Note that your personal databases are indexed each time, and that | 349 Note that your personal databases are indexed each time. The public ribosomal |
249 this may take some time depending on the size of the given database. | 350 databases are indexed when added, but they can be re-indexed with non-default indexing |
351 parameters. The indexing may take some time depending on the size of the given database. | |
352 | |
250 ]]> | 353 ]]> |
251 </help> | 354 </help> |
252 | 355 |
253 <citations> | 356 <citations> |
254 <citation type="doi">10.1093/bioinformatics/bts611</citation> | 357 <citation type="doi">10.1093/bioinformatics/bts611</citation> |