<!--
    Galaxy tool wrapper that runs gene_family_phylogeny_builder.py on a directory of
    orthogroup alignments (read from the selected input dataset's extra_files_path)
    using either RAxML or FastTree, as chosen in tree_inference_cond.
-->
<tool id="plant_tribes_gene_family_phylogeny_builder" name="GeneFamilyPhylogenyBuilder" version="@WRAPPER_VERSION@.0">
    <description>builds phylogenetic trees of aligned orthologous gene family clusters</description>
    <macros>
        <import>macros.xml</import>
    </macros>
    <expand macro="requirements_gene_family_phylogeny_builder" />
    <command detect_errors="exit_code">
        <![CDATA[
            ## Pull the selector values out of their conditionals once so the
            ## rest of the template can refer to them by short names.
            #set input_format = $input_format_cond.input_format
            #set tree_inference = $tree_inference_cond.tree_inference
            ## rooting_order_file_cond and bootstrap_replicates are only defined
            ## inside the 'raxml' branch of tree_inference_cond.
            #if str($tree_inference) == 'raxml':
                #set rooting_order_file_cond = $tree_inference_cond.rooting_order_file_cond
                #set rooting_order_file = $rooting_order_file_cond.rooting_order_file
                #if str($rooting_order_file) == 'yes':
                    #set rooting_order = $rooting_order_file_cond.rooting_order
                #end if
                #set bootstrap_replicates = $tree_inference_cond.bootstrap_replicates
            #end if

            ## The script path is quoted so an install directory containing
            ## spaces does not split the argument.
            python '$__tool_directory__/gene_family_phylogeny_builder.py'
            ## Each input format maps to an alignment directory, an alignment
            ## type (aln / filter / trim) and a sequence type. The '...ca'
            ## formats let the user pick the sequence type; the others are
            ## always 'protein'.
            #if str($input_format) == 'ptalign':
                --orthogroup_aln '$input_format_cond.input_ptalign.extra_files_path'
                --alignment_type 'aln'
                --sequence_type 'protein'
            #else if str($input_format) == 'ptalignca':
                --orthogroup_aln '$input_format_cond.input_ptalignca.extra_files_path'
                --alignment_type 'aln'
                --sequence_type '$input_format_cond.sequence_type'
            #else if str($input_format) == 'ptalignfiltered':
                --orthogroup_aln '$input_format_cond.input_ptalignfiltered.extra_files_path'
                --alignment_type 'filter'
                --sequence_type 'protein'
            #else if str($input_format) == 'ptalignfilteredca':
                --orthogroup_aln '$input_format_cond.input_ptalignfilteredca.extra_files_path'
                --alignment_type 'filter'
                --sequence_type '$input_format_cond.sequence_type'
            #else if str($input_format) == 'ptaligntrimmed':
                --orthogroup_aln '$input_format_cond.input_ptaligntrimmed.extra_files_path'
                --alignment_type 'trim'
                --sequence_type 'protein'
            #else if str($input_format) == 'ptaligntrimmedca':
                --orthogroup_aln '$input_format_cond.input_ptaligntrimmedca.extra_files_path'
                --alignment_type 'trim'
                --sequence_type '$input_format_cond.sequence_type'
            #end if
            ## The scaffold data table path is passed as both the scaffold and
            ## the configuration directory.
            --scaffold '$scaffold.fields.path'
            --config_dir '$scaffold.fields.path'
            --method $method
            --tree_inference $tree_inference
            #if str($tree_inference) == 'raxml':
                #if str($rooting_order_file) == 'yes':
                    --rooting_order '$rooting_order'
                    ## No else block needed here because the default rooting_order
                    ## configuration will be used if the --rooting_order flag is missing.
                #end if
                --bootstrap_replicates $bootstrap_replicates
                ## The phylip output only exists for RAxML runs (see the filter
                ## on the output_phylip dataset below).
                --output_phylip '$output_phylip'
                --output_phylip_dir '$output_phylip.files_path'
            #end if
            --min_orthogroup_size $min_orthogroup_size
            --max_orthogroup_size $max_orthogroup_size
            ## Use the slot count Galaxy allocates to the job, or 4 if unset.
            --num_threads \${GALAXY_SLOTS:-4}
            ## The right-hand side needs its leading $ so that Cheetah looks the
            ## name up as a Galaxy parameter instead of a plain Python name.
            #set output_pttree_dir = $output_pttree_dir_cond.output_pttree_dir
            #if str($output_pttree_dir) == 'yes':
                --output_tree '$output_tree'
                --output_tree_dir '$output_tree.files_path'
            #end if
        ]]>
    </command>
    <inputs>
        <!-- Alignment input: one data parameter per supported datatype; every
             dataset must have a non-empty extra_files_path. -->
        <conditional name="input_format_cond">
            <param name="input_format" type="select" label="Orthogroup alignments">
                <option value="ptalign">Proteins orthogroup alignments</option>
                <option value="ptalignca">Protein and coding sequences orthogroup alignments</option>
                <option value="ptalignfiltered">Filtered proteins orthogroup alignments</option>
                <option value="ptalignfilteredca">Filtered protein and coding sequences orthogroup alignments</option>
                <option value="ptaligntrimmed">Trimmed proteins orthogroup alignments</option>
                <option value="ptaligntrimmedca">Trimmed protein and coding sequences orthogroup alignments</option>
            </param>
            <when value="ptalign">
                <param name="input_ptalign" format="ptalign" type="data" label="Proteins orthogroup alignments">
                    <validator type="empty_extra_files_path" />
                </param>
            </when>
            <when value="ptalignca">
                <param name="input_ptalignca" format="ptalignca" type="data" label="Protein and coding sequences orthogroup alignments">
                    <validator type="empty_extra_files_path" />
                </param>
                <expand macro="param_sequence_type" />
            </when>
            <when value="ptalignfiltered">
                <param name="input_ptalignfiltered" format="ptalignfiltered" type="data" label="Filtered proteins orthogroup alignments">
                    <validator type="empty_extra_files_path" />
                </param>
            </when>
            <when value="ptalignfilteredca">
                <param name="input_ptalignfilteredca" format="ptalignfilteredca" type="data" label="Filtered protein and coding sequences orthogroup alignments">
                    <validator type="empty_extra_files_path" />
                </param>
                <expand macro="param_sequence_type" />
            </when>
            <when value="ptaligntrimmed">
                <param name="input_ptaligntrimmed" format="ptaligntrimmed" type="data" label="Trimmed proteins orthogroup alignments">
                    <validator type="empty_extra_files_path" />
                </param>
            </when>
            <when value="ptaligntrimmedca">
                <param name="input_ptaligntrimmedca" format="ptaligntrimmedca" type="data" label="Trimmed protein and coding sequences orthogroup alignments">
                    <validator type="empty_extra_files_path" />
                </param>
                <expand macro="param_sequence_type" />
            </when>
        </conditional>
        <expand macro="param_scaffold" />
        <expand macro="param_method" />
        <!-- Inference engine; the rooting order and bootstrap settings are
             offered for RAxML only. -->
        <conditional name="tree_inference_cond">
            <param name="tree_inference" type="select" label="Phylogenetic inference method">
                <option value="raxml" selected="true">RAxML</option>
                <option value="fasttree">FastTree</option>
            </param>
            <when value="raxml">
                <conditional name="rooting_order_file_cond">
                    <param name="rooting_order_file" type="select" label="Rooting order configuration">
                        <option value="no" selected="true">No</option>
                        <option value="yes">Yes</option>
                    </param>
                    <when value="no" />
                    <when value="yes">
                        <param name="rooting_order" format="txt" type="data" label="Rooting order configuration" />
                    </when>
                </conditional>
                <param name="bootstrap_replicates" type="integer" value="100" min="0" label="Bootstrap replicates" />
            </when>
            <when value="fasttree" />
        </conditional>
        <param name="max_orthogroup_size" type="integer" value="100" min="4" label="Maximum orthogroup size" />
        <param name="min_orthogroup_size" type="integer" value="4" min="4" label="Minimum orthogroup size" />
        <!-- Controls whether the optional output_tree dataset is produced. -->
        <conditional name="output_pttree_dir_cond">
            <param name="output_pttree_dir" type="select" label="Output additional directory of phylogenetic tree files?">
                <option value="no" selected="true">No</option>
                <option value="yes">Yes</option>
            </param>
            <when value="no" />
            <when value="yes" />
        </conditional>
    </inputs>
    <outputs>
        <!-- Always produced: one collection element per file discovered in the
             orthogroups_tree directory. -->
        <collection name="tree" type="list" label="GeneFamilyPhylogenyBuilder phylogenetic trees (dataset collection) on ${on_string}">
            <discover_datasets pattern="__name__" directory="geneFamilyPhylogenies_dir/orthogroups_tree" format="nhx" />
        </collection>
        <!-- Produced only when the user asks for the additional tree directory. -->
        <data name="output_tree" format="pttree" label="GeneFamilyPhylogenyBuilder phylogenetic trees (directory) on ${on_string}">
            <filter>output_pttree_dir_cond['output_pttree_dir'] == 'yes'</filter>
        </data>
        <!-- Produced only for RAxML runs, matching the command template. -->
        <data name="output_phylip" format="ptphylip" label="GeneFamilyPhylogenyBuilder orthogroup phylip multiple sequence alignments on ${on_string}">
            <filter>tree_inference_cond['tree_inference'] == 'raxml'</filter>
        </data>
    </outputs>
    <tests>
        <!-- NOTE(review): placeholder test with no parameters or output
             assertions; replace with a real test case once suitable test data
             is available. -->
        <test>
        </test>
    </tests>
    <help>
This tool is one of the PlantTribes collection of automated modular analysis pipelines for comparative and evolutionary
analyses of genome-scale gene families and transcriptomes. This tool performs gene family phylogenetic inference of
multiple sequence alignments produced by the GeneFamilyAligner tool.

-----

**Required options**

 * **Orthogroup alignments** - orthogroup alignment fasta files produced by the GeneFamilyAligner tool selected from your history. Depending on how the GeneFamilyAligner tool was executed, these could either be pre-processed alignments, trimmed alignments or both trimmed and filtered alignments.
 * **Gene family scaffold** - one of the PlantTribes gene family scaffolds installed into Galaxy by the PlantTribes Scaffold Download Data Manager tool.
 * **Protein clustering method** - gene family scaffold protein clustering method as described in the AssemblyPostProcessor tool.
 * **Phylogenetic inference method** - method for estimating orthogroup maximum likelihood (ML) phylogenetic trees. PlantTribes estimates ML phylogenetic trees using either RAxML or FastTree algorithms.

**Other options**

 * **Rooting order configuration** - select 'Yes' to enable selection of a rooting order configuration file for RAxML. Scaffold configuration templates (.rootingOrder.config) of how to customize the RAxML ML tree rooting order can be found in the scaffold data installed into Galaxy via the PlantTribes Scaffolds Download Data Manager tool, and are also available at the PlantTribes GitHub `repository`_. Phylogenetic tree rooting order settings shown in these templates are used as defaults if 'No' is selected.
 * **Bootstrap replicates** - number of bootstrap replicates for RAxML to conduct a rapid bootstrap analysis and search for the best-scoring ML tree (default = 100).
 * **Maximum orthogroup size** - maximum number of sequences allowed in orthogroup alignments (default = 100).
 * **Minimum orthogroup size** - minimum number of sequences allowed in orthogroup alignments (default = 4).

.. _repository: https://github.com/dePamphilis/PlantTribes/tree/master/config

    </help>
    <citations>
        <expand macro="citation1" />
        <citation type="bibtex">
            @article{Wall2008,
            journal = {Nucleic Acids Research},
            author = {Wall PK, Leebens-Mack J, Muller KF, Field D, Altman NS},
            title = {PlantTribes: a gene and gene family resource for comparative genomics in plants},
            year = {2008},
            volume = {36},
            number = {suppl 1},
            pages = {D970-D976},}
        </citation>
        <citation type="bibtex">
            @article{Sasidharan2012,
            journal = {Nucleic Acids Research},
            author = {Sasidharan R, Nepusz T, Swarbreck D, Huala E, Paccanaro A},
            title = {GFam: a platform for automatic annotation of gene families},
            year = {2012},
            pages = {gks631},}
        </citation>
        <citation type="bibtex">
            @article{Li2003,
            journal = {Genome Research},
            author = {Li L, Stoeckert CJ, Roos DS},
            title = {OrthoMCL: identification of ortholog groups for eukaryotic genomes},
            year = {2003},
            volume = {13},
            number = {9},
            pages = {2178-2189},}
        </citation>
        <citation type="bibtex">
            @article{Emms2015,
            journal = {Genome Biology},
            author = {Emms DM, Kelly S},
            title = {OrthoFinder: solving fundamental biases in whole genome comparisons dramatically improves orthogroup inference accuracy},
            year = {2015},
            volume = {16},
            number = {1},
            pages = {157},}
        </citation>
        <citation type="bibtex">
            @article{Stamatakis2014,
            journal = {Bioinformatics},
            author = {Stamatakis A},
            title = {RAxML Version 8: A tool for Phylogenetic Analysis and Post-Analysis of Large Phylogenies},
            year = {2014},
            url = {http://sco.h-its.org/exelixis/web/software/raxml/index.html},}
        </citation>
        <citation type="bibtex">
            @article{Price2010,
            journal = {PLoS one},
            author = {Price MN, Dehal PS, Arkin AP},
            title = {FastTree 2-approximately maximum-likelihood trees for large alignments},
            year = {2010},
            volume = {5},
            number = {3},
            pages = {e9490},}
        </citation>
    </citations>
</tool>