<?xml version="1.0" encoding="UTF-8"?>
<!--
    Galaxy tool wrapper around sms.sh (Smart Model Selection for PhyML).
    The command selects a substitution model for a PHYLIP alignment and,
    because the tree-inference flag is always passed, also infers a tree
    with PhyML using the selected model.
-->
<tool id="phyml-sms" name="PhyML-SMS" version="1.3.1">
    <description>Maximum likelihood-based inference of phylogenetic trees with Smart Model Selection</description>
    <requirements>
        <requirement type="package" version="1.3">phyml-sms</requirement>
    </requirements>
    <command><![CDATA[
        ## Results are written to the job working directory (-o .) and moved
        ## to the Galaxy output datasets once sms.sh has finished.
        sms.sh
        -i '$input'
        -o .
        -p '$output_models'
        -t

        #if $sequence.seqtype == "cfg"
            ## Automatic sequence detection
            ## read an info file to choose which option set
            #set $info = open( str($sequence.input_info) ).read()

            #if 'dna' in $info:
                -d nt
            #else if 'protein' in $info :
                -d aa
            #end if
            ## NOTE(review): when the info file mentions neither 'dna' nor
            ## 'protein', no -d option is emitted; confirm this is acceptable.
        #else
            -d $sequence.seqtype
        #end if

        -c $stat_crit

        #if $inpuTree.inputtree == "true" :
            -u '$inpuTree.userInpuTree'
        #end if
        -s $move

        ## Branch support: negative codes select a test, a positive value is
        ## the number of bootstrap replicates, 0 disables branch support.
        #if $support_condition.support == "sh":
            -b -4
        #else if $support_condition.support == "aBayes":
            -b -5
        #else if $support_condition.support == "no":
            -b 0
        #else if $support_condition.support == "boot":
            -b $support_condition.boot_number
        #end if

        ## Random starting trees are only passed together with SPR moves.
        #if $randstart.value != 0 and $move.value == "SPR" :
            -r $randstart
        #end if
        > '$output_stdout'
        ;
        mv *_phyml_tree.txt '$output_tree';
        mv *_phyml_stats.txt '$output_stats';
    ]]>
    </command>
    <inputs>
        <param format="phylip" name="input" type="data" label="Alignment file" help="phylip format"/>
        <!-- Data type: chosen explicitly, or read from a precomputed info file ("cfg"). -->
        <conditional name="sequence">
            <param name="seqtype" type="select" label="Data type">
                <option value="nt">Nucleic acids</option>
                <option value="aa">Amino acids</option>
                <option value="cfg">Detect from info file</option>
            </param>
            <when value="cfg">
                <param name="input_info" type="data" format="txt" label="info" help="Precomputed file containing the sequence description (dna or protein)" />
            </when>
            <when value="nt" />
            <when value="aa" />
        </conditional>
        <param name="stat_crit" type="select" label="Statistical criterion to select the model">
            <option value="aic">AIC</option>
            <option value="bic">BIC</option>
        </param>
        <param name="move" type="select" label="Tree topology search" display="radio">
            <option value="NNI">NNI (Nearest Neighbor Interchange)</option>
            <option value="SPR">SPR (Subtree Pruning and Regrafting)</option>
        </param>
        <conditional name="support_condition">
            <param type="select" name="support" label="Branch support" help="Use aLRT or aBayes to save computing time">
                <option value="sh">SH-like aLRT</option>
                <option value="aBayes">aBayes</option>
                <option value="boot">Bootstrap</option>
                <option value="no">No branch support</option>
            </param>
            <when value="sh"/>
            <when value="aBayes"/>
            <when value="boot">
                <param type="integer" name="boot_number" min="1" value="100" label="Number of bootstrap replicates" help="Must be a positive integer"/>
            </when>
            <when value="no"/>
        </conditional>
        <conditional name="inpuTree">
            <param name="inputtree" type="boolean" truevalue="true" falsevalue="false" checked="False" label="Use input starting tree" />
            <when value="true">
                <param name="userInpuTree" type="data" label="Tree file" help="newick format"/>
            </when>
            <when value="false"/>
        </conditional>
        <!-- Only forwarded to sms.sh when non-zero and the SPR topology search is selected. -->
        <param type="integer" name="randstart" value="0" min="0" max="10" label="Number of random starting trees" />
    </inputs>
    <outputs>
        <data format="nhx" name="output_tree" label="PhyML Newick tree"/>
        <data format="txt" name="output_stats" label="PhyML Statistics"/>
        <!-- Captures the standard output of sms.sh. -->
        <data format="txt" name="output_stdout" label="SMS Best Model"/>
        <data format="txt" name="output_models" label="SMS compare models"/>
    </outputs>
    <tests>
        <test>
            <param name="input" value="phylip" />
            <param name="seqtype" value="nt" />
            <output name="output_models" file="sms.csv" />

        </test>
    </tests>
    <help><![CDATA[

.. class:: infomark

This script runs SMS to select the substitution model which best fits the input data.
It may also run PhyML with the selected model.

SMS options :

| -h = Help
| -i = **Mandatory** Input alignment file in PHYLIP format
| -d = **Mandatory** Data type : 'aa' or 'nt'
| -o = Output directory
| -p = Output CSV filename
| -c = Statistical criterion to select the model : 'AIC' (default) or 'BIC'
| -u = Input starting tree (Newick format)
| -t = Use this option if you want SMS to infer a tree with PhyML using the SMS selected model

PhyML options :

| -s = Type of tree improvement : 'NNI (default)' or 'SPR'
| -r = Number of random starting trees : 0 (default)
| -b = Branch Support : >0 for bootstraps, -4 for aLRT, -5 for aBayes, 0 (default)

**PhyML 20120412**

-----


===========
Overview:
===========

PhyML is a phylogeny software based on the maximum-likelihood principle. Early PhyML versions used a fast algorithm to perform Nearest Neighbor Interchanges (NNIs), in order to improve a reasonable starting tree topology. Since the original publication (Guindon and Gascuel 2003), PhyML has been widely used due to its simplicity and a fair accuracy/speed compromise. In the meantime, research around PhyML has continued.

We designed an efficient algorithm to search the tree space using Subtree Pruning and Regrafting (SPR) topological moves (Hordijk and Gascuel 2005), and proposed a fast branch test based on an approximate likelihood ratio test (Anisimova and Gascuel 2006). However, these novelties were not included in the official version of PhyML, and we found that improvements were still needed in order to make them effective in some practical cases. PhyML 3.0 achieves this task.

It implements new algorithms to search the space of tree topologies with user-defined intensity. A non-parametric, Shimodaira-Hasegawa-like branch test is also available. The program provides a number of new evolutionary models and its interface was entirely re-designed. We tested PhyML 3.0 on a large collection of real data sets to ensure that the new version is stable, ready-to-use and still reasonably fast and accurate.

-----

For further information, please visit the PhyML_ and SMS_ websites.


.. _PhyML: http://www.atgc-montpellier.fr/phyml/
.. _SMS: http://www.atgc-montpellier.fr/phyml-sms/


Models References:

- Dayhoff : Dayhoff, M., Schwartz, R. & Orcutt, B.
  A model of evolutionary change in proteins.
  In Dayhoff, M. (ed.) Atlas of Protein Sequence and Structure, vol. 5, 345–352 (National Biomedical Research Foundation, Washington, D. C., 1978)

- JTT : Jones, D., Taylor, W. & Thornton, J.
  The rapid generation of mutation data matrices from protein sequences.
  Computer Applications in the Biosciences (CABIOS) 8, 275–282 (1992).

- Blosum62 : Henikoff, S. & Henikoff, J.
  Amino acid substitution matrices from protein blocks.
  Proceedings of the National Academy of Sciences of the United States of America (PNAS) 89, 10915–10919 (1992).

- MtREV : Adachi, J. & Hasegawa, M.
  MOLPHY version 2.3. programs for molecular phylogenetics based on maximum likelihood.
  In Ishiguro, M. et al. (eds.) Computer Science Monographs, 28 (The Institute of Statistical Mathematics, Tokyo, 1996).

- MtMam : Cao, Y., A. Janke , P. J. Waddell, M. Westerman, O. Takenaka, S. Murata, N. Okada, S. Paabo, and M. Hasegawa
  Conflict among individual mitochondrial proteins in resolving the phylogeny of eutherian orders.
  Journal of Molecular Evolution 47, 307–322 (1998).

- CpREV : Adachi, J., P., W., Martin, W. & Hasegawa, M.
  Plastid genome phylogeny and a model of amino acid substitution for proteins encoded by chloroplast DNA.
  Journal of Molecular Evolution 50, 348–358 (2000).

- VT : Muller, T. & Vingron, M.
  Modeling amino acid replacement.
  Journal of Computational Biology 7, 761–776 (2000).

- WAG : Whelan, S. & Goldman, N.
  A general empirical model of protein evolution derived from multiple protein families using a maximum-likelihood approach.
  Molecular Biology and Evolution 18, 691–699 (2001).

- RtREV : Dimmic, M., Rest, J., Mindell, D. & Goldstein, D.
  rtREV : an amino acid substitution matrix for inference of retrovirus and reverse transcriptase phylogeny.
  Journal of Molecular Evolution 55, 65–73 (2002).

- DCMut : Kosiol, C. & Goldman, N.
  Different versions of the Dayhoff rate matrix.
  Molecular Biology and Evolution 22, 193–199 (2004).

- MtArt : Abascal F, Posada D, Zardoya R.
  MtArt: a new model of amino acid replacement for Arthropoda.
  Mol Biol Evol. 2007 Jan;24(1):1-5. Epub 2006 Oct 16.

- HIVb - HIVw : Nickle DC, Heath L, Jensen MA, Gilbert PB, Mullins JI, Kosakovsky Pond SL.
  HIV-Specific Probabilistic Models of Protein Evolution.
  PLoS ONE. 2007 Jun 6;2:e503.

- LG : Le, S. & Gascuel, O.
  An improved general amino-acid replacement matrix.
  Mol. Biol. Evol. 25, 1307–1320 (2008)

- MtZOA : Rota-Stabelli O, Yang Z, Telford MJ
  MtZoa: A general mitochondrial amino acid substitutions model for animal evolutionary studies
  Molecular Phylogenetics and Evolution 52 (2009) 268–272

- FLU : Cuong Cao Dang, Quang Si Le, Olivier Gascuel and Vinh Sy Le
  FLU, an amino acid substitution model for influenza proteins.
  BMC Evolutionary Biology 2010 Apr 12;10:99

- AB :
  Alexander Mirsky, Linda Kazandjian and Maria Anisimova
  Antibody-specific Model of Amino Acid Substitution for Immunological Inferences from Alignments of Antibody Sequences
  Mol Biol Evol (2014) doi: 10.1093/molbev/msu340
    ]]>
    </help>
    <citations>
        <citation type="doi">10.1093/sysbio/syq010</citation>
        <citation type="doi">10.1093/nar/gki352</citation>
        <citation type="doi">10.1080/10635150390235520</citation>
    </citations>
</tool>