Mercurial > repos > rnateam > mirdeep2_mapper
comparison mapper.xml @ 3:79fdac89dd6e draft default tip
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/mirdeep2/mirdeep2_mapper commit 04c75332ac618b43ce5c3f307f7866e97147e865
author | rnateam |
---|---|
date | Thu, 05 Apr 2018 08:54:49 -0400 |
parents | f844a9c1698d |
children |
comparison
equal
deleted
inserted
replaced
2:f844a9c1698d | 3:79fdac89dd6e |
---|---|
1 <tool id="rbc_mirdeep2_mapper" name="MiRDeep2 Mapper" version="2.0.0"> | 1 <tool id="rbc_mirdeep2_mapper" name="MiRDeep2 Mapper" version="2.0.0.8.1"> |
2 <description>process and map reads to a reference genome</description> | |
2 <macros> | 3 <macros> |
3 <macro name="map_params"> | 4 <macro name="map_params"> |
4 <conditional name="refGenomeSource"> | 5 <conditional name="refGenomeSource"> |
5 <param name="genomeSource" type="select" label="Will you select a reference genome from your history or use a built-in index?" help="Map to genome. (-p)"> | 6 <param name="genomeSource" type="select" label="Will you select a reference genome from your history or use a built-in index?" help="Map to genome. (-p)"> |
6 <option value="indexed">Use a built-in index</option> | 7 <option value="indexed">Use a built-in index</option> |
13 <validator type="no_options" message="No indexes are available for the selected input dataset"/> | 14 <validator type="no_options" message="No indexes are available for the selected input dataset"/> |
14 </options> | 15 </options> |
15 </param> | 16 </param> |
16 </when> <!-- build-in --> | 17 </when> <!-- build-in --> |
17 <when value="history"> | 18 <when value="history"> |
18 <param name="ownFile" type="data" format="fasta" metadata_name="dbkey" label="Select the reference genome" /> | 19 <param name="ownFile" type="data" format="fasta" label="Select the reference genome" /> |
19 </when> <!-- history --> | 20 </when> <!-- history --> |
20 </conditional> <!-- refGenomeSource --> | 21 </conditional> <!-- refGenomeSource --> |
21 <param name="map_mismatch" type="boolean" truevalue="-q" falsevalue="" checked="false" label="Map with one mismatch in the seed (mapping takes longer)" help="(-q)"/> | 22 <param name="map_mismatch" type="boolean" truevalue="-q" falsevalue="" checked="false" label="Map with one mismatch in the seed (mapping takes longer)" help="(-q)"/> |
22 <param name="map_threshold" value="5" type="integer" optional="false" label="A read is allowed to map up to this number of positions in the genome" help="Map threshold. (-r)"> | 23 <param name="map_threshold" value="5" type="integer" optional="false" label="A read is allowed to map up to this number of positions in the genome" help="Map threshold. (-r)"> |
23 <validator type="in_range" min="1" message="Minimum value is 1"/> | 24 <validator type="in_range" min="1" message="Minimum value is 1"/> |
24 </param> | 25 </param> |
25 </macro> | 26 </macro> |
26 </macros> | 27 </macros> |
27 <description> | 28 <requirements> |
29 <requirement type="package" version="2.0.0.8">mirdeep2</requirement> | |
30 </requirements> | |
31 <command detect_errors="aggressive"> | |
28 <![CDATA[ | 32 <![CDATA[ |
29 process and map reads to a reference genome | |
30 ]]> | |
31 </description> | |
32 <requirements> | |
33 <requirement type="package" version="2.0">mirdeep2_mapper</requirement> | |
34 <requirement type="package" version="0.12.7">bowtie</requirement> | |
35 <requirement type="package" version="5.18.1">perl</requirement> | |
36 </requirements> | |
37 | |
38 <command> | |
39 <![CDATA[ | |
40 | |
41 #if $operation.collapse_map == "collapse_and_map" or $operation.collapse_map == "only_map" | 33 #if $operation.collapse_map == "collapse_and_map" or $operation.collapse_map == "only_map" |
42 #if $operation.refGenomeSource.genomeSource == "history" | 34 #if $operation.refGenomeSource.genomeSource == "history" |
43 bowtie-build '$operation.refGenomeSource.ownFile' custom_bowtie_indices && | 35 bowtie-build '$operation.refGenomeSource.ownFile' custom_bowtie_indices && |
44 #end if | 36 #end if |
45 #end if | 37 #end if |
46 | 38 |
47 mapper.pl | 39 mapper.pl |
48 | 40 |
49 '$reads' | 41 #if $input.type == "single": |
50 | 42 '$input.reads' |
51 #if $reads.extension.startswith("fasta") | 43 |
52 -c | 44 #if $input.reads.extension.startswith("fasta") |
53 #else if $reads.extension.startswith("fastq") | 45 -c |
54 -e | 46 #else if $input.reads.extension.startswith("fastq") |
55 -h | 47 -e |
48 -h | |
49 #end if | |
50 #else: | |
51 '$samples' -d | |
52 | |
53 #if $input.reads_list[0].reads.extension.startswith("fasta") | |
54 -c | |
55 #else if $input.reads_list[0].reads.extension.startswith("fastq") | |
56 -e | |
57 -h | |
58 #end if | |
56 #end if | 59 #end if |
57 | 60 |
58 $remove_non_canon | 61 $remove_non_canon |
59 | 62 |
60 $convert_rna_dna | 63 $convert_rna_dna |
61 | 64 |
62 #if $clip_adapter.clip == "true" | 65 #if $clip_adapter.clip == "true" |
63 -k $clip_adapter.adapter_seq | 66 -k $clip_adapter.adapter_seq |
64 #end if | 67 #end if |
66 -l $discard_short_reads | 69 -l $discard_short_reads |
67 | 70 |
68 #if $operation.collapse_map == "collapse_and_map" or $operation.collapse_map == "only_collapse" | 71 #if $operation.collapse_map == "collapse_and_map" or $operation.collapse_map == "only_collapse" |
69 -m -s '$output_reads_collapsed' | 72 -m -s '$output_reads_collapsed' |
70 #end if | 73 #end if |
71 | 74 |
72 #if $operation.collapse_map == "collapse_and_map" or $operation.collapse_map == "only_map" | 75 #if $operation.collapse_map == "collapse_and_map" or $operation.collapse_map == "only_map" |
73 -p | 76 -p |
74 | 77 |
75 #if $operation.refGenomeSource.genomeSource == "history" | 78 #if $operation.refGenomeSource.genomeSource == "history" |
76 custom_bowtie_indices | 79 custom_bowtie_indices |
77 #else | 80 #else |
78 '$operation.refGenomeSource.index.fields.path' | 81 '$operation.refGenomeSource.index.fields.path' |
79 #end if | 82 #end if |
80 $operation.map_mismatch | 83 $operation.map_mismatch |
81 -r $operation.map_threshold | 84 -r $operation.map_threshold |
82 | 85 |
83 -t '$output_mapping' | 86 -t '$output_mapping' |
84 #end if | 87 #end if |
85 | 88 |
86 -v -n | 89 -v -n |
87 ]]> | 90 ]]> |
88 </command> | 91 </command> |
89 <stdio> | 92 <configfiles> |
90 <!-- Anything other than zero is an error --> | 93 <configfile name="samples"><![CDATA[#if $input.type == "multiple": |
91 <exit_code range="1:" /> | 94 #for $r in $input.reads_list: |
92 <exit_code range=":-1" /> | 95 $r.reads $r.sample_name |
93 <!-- In case the return code has not been set propery check stderr too --> | 96 #end for |
94 <regex match="Error:" /> | 97 #end if]]></configfile> |
95 <regex match="Exception:" /> | 98 </configfiles> |
96 </stdio> | |
97 <inputs> | 99 <inputs> |
98 <param format="fastq, fasta" name="reads" type="data" optional="false" label="Deep sequencing reads" help="Reads in fastq or FASTA format"/> | 100 <conditional name="input"> |
101 <param name="type" type="select" label="Pool multiple read sets"> | |
102 <option value="single" selected="true">No</option> | |
103 <option value="multiple">Yes</option> | |
104 </param> | |
105 <when value="single"> | |
106 <param format="fastq,fasta" name="reads" type="data" label="Deep sequencing reads" help="Reads in fastq or FASTA format"/> | |
107 </when> | |
108 <when value="multiple"> | |
109 <repeat name="reads_list" title="Reads"> | |
110 <param name="sample_name" value="" type="text" label="Sample name" help="Must be a 3 letters/digits code"> | |
111 <validator type="expression" message="The sample name must be a 3 letters/digits code">len(value) == 3 and value.isalnum()</validator> | |
112 </param> | |
113 <param format="fastq,fasta" name="reads" type="data" optional="false" label="Deep sequencing reads" help="Reads in fastq or FASTA format"/> | |
114 </repeat> | |
115 </when> | |
116 </conditional> | |
99 <param name="remove_non_canon" type="boolean" truevalue="-j" falsevalue="" checked="false" label="Remove reads with non-standard nucleotides" help="Remove all entries that have a sequence that contains letters other than a,c,g,t,u,n,A,C,G,T,U,N. (-j)"/> | 117 <param name="remove_non_canon" type="boolean" truevalue="-j" falsevalue="" checked="false" label="Remove reads with non-standard nucleotides" help="Remove all entries that have a sequence that contains letters other than a,c,g,t,u,n,A,C,G,T,U,N. (-j)"/> |
100 <param name="convert_rna_dna" type="boolean" truevalue="-i" falsevalue="" checked="false" label="Convert RNA to DNA alphabet (to map against genome)" help="(-i)"/> | 118 <param name="convert_rna_dna" type="boolean" truevalue="-i" falsevalue="" checked="false" label="Convert RNA to DNA alphabet (to map against genome)" help="(-i)"/> |
101 | 119 |
102 <conditional name="clip_adapter"> | 120 <conditional name="clip_adapter"> |
103 <param name="clip" type="select" label="Clip 3' Adapter Sequence" help="(-k)"> | 121 <param name="clip" type="select" label="Clip 3' Adapter Sequence" help="(-k)"> |
109 <validator type="regex" message="Adapter can ONLY contain a,c,g,t,u,n,A,C,G,T,U,N">^[ACGTUacgtu]+$</validator> | 127 <validator type="regex" message="Adapter can ONLY contain a,c,g,t,u,n,A,C,G,T,U,N">^[ACGTUacgtu]+$</validator> |
110 </param> | 128 </param> |
111 </when> | 129 </when> |
112 <when value="false"/> | 130 <when value="false"/> |
113 </conditional> | 131 </conditional> |
114 | 132 |
115 <param name="discard_short_reads" value="18" type="integer" optional="false" label="Discard reads shorter than this length" help="Set to 0 to keep all reads. (-l)"> | 133 <param name="discard_short_reads" value="18" type="integer" optional="false" label="Discard reads shorter than this length" help="Set to 0 to keep all reads. (-l)"> |
116 <validator type="in_range" min="0" message="Minimum value is 0"/> | 134 <validator type="in_range" min="0" message="Minimum value is 0"/> |
117 </param> | 135 </param> |
118 | 136 |
119 <conditional name="operation"> | 137 <conditional name="operation"> |
120 <param name="collapse_map" type="select" label="Collapse reads and/or Map" help="(-m) and/or (-p)"> | 138 <param name="collapse_map" type="select" label="Collapse reads and/or Map" help="(-m) and/or (-p)"> |
121 <option value="collapse_and_map">Collapse reads and Map</option> | 139 <option value="collapse_and_map">Collapse reads and Map</option> |
122 <option value="only_map">Map</option> | 140 <option value="only_map">Map</option> |
123 <option value="only_collapse">Collapse</option> | 141 <option value="only_collapse">Collapse</option> |
149 </filter> | 167 </filter> |
150 </data> | 168 </data> |
151 </outputs> | 169 </outputs> |
152 <tests> | 170 <tests> |
153 <test> | 171 <test> |
154 <param name="reads" value="reads.fa"/> | 172 <conditional name="input"> |
173 <param name="type" value="single"/> | |
174 <param name="reads" value="reads.fa"/> | |
175 </conditional> | |
155 <param name="remove_non_canon" value="True"/> | 176 <param name="remove_non_canon" value="True"/> |
156 <param name="clip" value="true"/> | 177 <param name="clip" value="true"/> |
157 <param name="adapter_seq" value="TCGTATGCCGTCTTCTGCTTGT"/> | 178 <param name="adapter_seq" value="TCGTATGCCGTCTTCTGCTTGT"/> |
158 <param name="discard_short_reads" value="18"/> | 179 <param name="discard_short_reads" value="18"/> |
159 <param name="collapse_map" value="collapse_and_map"/> | 180 <param name="collapse_map" value="collapse_and_map"/> |
176 <has_line_matching expression="^.*22\t1\t22\ttcaccgggagaaaaactggtgt\tchrII:11534525-11540624\t22\t3382\t3403.*$"/> | 197 <has_line_matching expression="^.*22\t1\t22\ttcaccgggagaaaaactggtgt\tchrII:11534525-11540624\t22\t3382\t3403.*$"/> |
177 <has_line_matching expression="^.*25\t1\t25\ttcaccgggtggaaactagcagtggc\tchrII:11534525-11540624\t25\t3060\t3084.*$"/> | 198 <has_line_matching expression="^.*25\t1\t25\ttcaccgggtggaaactagcagtggc\tchrII:11534525-11540624\t25\t3060\t3084.*$"/> |
178 </assert_contents> | 199 </assert_contents> |
179 </output> | 200 </output> |
180 </test> | 201 </test> |
202 <test> | |
203 <conditional name="input"> | |
204 <param name="type" value="multiple"/> | |
205 <repeat name="reads_list"> | |
206 <param name="sample_name" value="sa1"/> | |
207 <param name="reads" value="reads_sample1.fa"/> | |
208 </repeat> | |
209 <repeat name="reads_list"> | |
210 <param name="sample_name" value="sa2"/> | |
211 <param name="reads" value="reads_sample2.fa"/> | |
212 </repeat> | |
213 </conditional> | |
214 <param name="remove_non_canon" value="True"/> | |
215 <param name="clip" value="true"/> | |
216 <param name="adapter_seq" value="TCGTATGCCGTCTTCTGCTTGT"/> | |
217 <param name="discard_short_reads" value="18"/> | |
218 <param name="collapse_map" value="collapse_and_map"/> | |
219 <param name="genomeSource" value="history"/> | |
220 <param name="ownFile" value="cel_cluster.fa"/> | |
221 <output name="output_reads_collapsed"> | |
222 <assert_contents> | |
223 <has_text text=">sa1_220_x1"/> | |
224 <has_text text="TCACCGGGTGTACATCAGC"/> | |
225 <has_text text=">sa2_0_x250"/> | |
226 <has_text text="AATGACACTGGTTATCTTTTCCATCG"/> | |
227 </assert_contents> | |
228 </output> | |
229 <output name="output_mapping"> | |
230 <assert_contents> | |
231 <has_line_matching expression="^.*22\t1\t22\ttcaccgggtggaaactagcagt\tchrII:11534525-11540624\t22\t3060\t3081.*$"/> | |
232 <has_line_matching expression="^.*21\t1\t21\ttcaccgggtggaaactagcag\tchrII:11534525-11540624\t21\t3060\t3080.*$"/> | |
233 <has_line_matching expression="^.*22\t1\t22\ttcaccgggtgtacatcagctaa\tchrII:11534525-11540624\t22\t3631\t3652.*$"/> | |
234 </assert_contents> | |
235 </output> | |
236 </test> | |
181 </tests> | 237 </tests> |
182 <help> | 238 <help> |
183 <![CDATA[ | 239 <![CDATA[ |
184 **What it does** | 240 **What it does** |
185 | 241 |
186 The MiRDeep2 Mapper module is designed as a tool to process deep sequencing reads and/or map them to the reference genome. | 242 The MiRDeep2 Mapper module is designed as a tool to process deep sequencing reads and/or map them to the reference genome. |
187 The module works in sequence space, and can process or map data that is in sequence FASTA format. | 243 The module works in sequence space, and can process or map data that is in sequence FASTA format. |
188 A number of the functions of the mapper module are implemented specifically with Solexa/Illumina data in mind. | 244 A number of the functions of the mapper module are implemented specifically with Solexa/Illumina data in mind. |
189 | 245 |
190 **Input** | 246 **Input** |
191 | 247 |
192 Default input is a file in FASTA format, seq.txt or qseq.txt format. More input can be given depending on the options used. | 248 Default input is a file in FASTA format, seq.txt or qseq.txt format. More input can be given depending on the options used. |
193 | 249 |
194 **Output** | 250 **Output** |
195 | 251 |
196 The output depends on the options used. Either a FASTA file with processed reads or an arf file with with mapped reads, or both, are output. | 252 The output depends on the options used. Either a FASTA file with processed reads or an arf file with with mapped reads, or both, are output. |
197 | 253 |
198 Arf format: | 254 Arf format: |
199 Is a proprietary file format generated and processed by miRDeep2. It contains information of reads mapped to a reference genome. Each line in such a file contains 13 columns: | 255 Is a proprietary file format generated and processed by miRDeep2. It contains information of reads mapped to a reference genome. Each line in such a file contains 13 columns: |
200 | 256 |
201 1. read identifier | 257 1. read identifier |