comparison hyphy_fubar.xml @ 10:da4fd8c3ad0c draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/hyphy/ commit b'446f1cfedd192ab0e7456495383c2099331379cc\n'-dirty
author rdvelazquez
date Mon, 11 Feb 2019 14:17:08 -0500
parents 55dd19bffb00
children 8600d5c4e466
comparison
equal deleted inserted replaced
9:55dd19bffb00 10:da4fd8c3ad0c
1 <?xml version="1.0"?> 1 <?xml version="1.0"?>
2 <tool id="hyphy_fubar" name="HyPhy-FUBAR" version="@VERSION@+galaxy0"> 2 <tool id="hyphy_fubar" name="HyPhy-FUBAR" version="@VERSION@+galaxy0">
3 <description>: Fast Unconstrained Bayesian AppRoximation</description> 3 <description>Fast Unconstrained Bayesian AppRoximation</description>
4 <macros> 4 <macros>
5 <import>macros.xml</import> 5 <import>macros.xml</import>
6 </macros> 6 </macros>
7 <expand macro="requirements" /> 7 <expand macro="requirements" />
8 <version_command>HYPHYMP --version | tail -n 1 | awk '{print $1}'</version_command> 8 <expand macro="version_command" />
9 <command detect_errors="exit_code"> 9 <command detect_errors="exit_code">
10 <![CDATA[ 10 <![CDATA[
11 ln -s '$input_file' fubar_input.fa && 11 ln -s '$input_file' fubar_input.fa &&
12 ln -s '$input_nhx' fubar_input.nhx && 12 ln -s '$input_nhx' fubar_input.nhx &&
13 echo $gencodeid > tool_params && 13 echo $gencodeid > tool_params &&
14 echo `pwd`/fubar_input.fa >> tool_params && 14 echo `pwd`/fubar_input.fa >> tool_params &&
15 echo `pwd`/fubar_input.nhx >> tool_params && 15 echo `pwd`/fubar_input.nhx >> tool_params &&
16 echo '$grid_points' >> tool_params && 16 echo '$grid_points' >> tool_params &&
17 echo '$posterior' >> tool_params &&
17 echo '$mcmc' >> tool_params && 18 echo '$mcmc' >> tool_params &&
18 echo '$chain_length' >> tool_params && 19 echo '$chain_length' >> tool_params &&
19 echo '$samples' >> tool_params && 20 echo '$samples' >> tool_params &&
20 echo '$samples_per_chain' >> tool_params && 21 echo '$samples_per_chain' >> tool_params &&
21 echo '$concentration' >> tool_params && 22 echo '$concentration' >> tool_params &&
22 @HYPHY_INVOCATION@ \$HYPHY_LIB/TemplateBatchFiles/SelectionAnalyses/FUBAR.bf > '$fubar_log' 23 @HYPHY_INVOCATION@ \$HYPHY_LIB/TemplateBatchFiles/SelectionAnalyses/FUBAR.bf > '$fubar_log'
23 ]]> 24 ]]>
24 </command> 25 </command>
25 <inputs> 26 <inputs>
26 <param name="input_file" type="data" format="fasta" label="Input FASTA file" /> 27 <expand macro="inputs" />
27 <param name="input_nhx" type="data" format="nhx" label="Input newick file" /> 28 <expand macro="gencode" />
28 <param name="gencodeid" type="select" label="Genetic code"> 29 <param name="grid_points" type="integer" value="20" min="5" max="50" label="Grid points" />
29 <option value="1">Universal code</option> 30 <param name="posterior" type="select" label="Posterior estimation method">
30 <option value="2">Vertebrate mitochondrial DNA code</option> 31 <option value="1">Full Metropolis-Hastings MCMC algorithm</option>
31 <option value="3">Yeast mitochondrial DNA code</option> 32 <option value="2">Collapsed Gibbs sampler</option>
32 <option value="4">Mold, Protozoan and Coelenterate mt; Mycloplasma/Spiroplasma</option> 33 <option value="3">0-th order Variational Bayes approximations</option>
33 <option value="5">Invertebrate mitochondrial DNA code</option>
34 <option value="6">Ciliate, Dasycladacean and Hexamita Nuclear code</option>
35 <option value="7">Echinoderm mitochondrial DNA code</option>
36 <option value="8">Euplotid Nuclear code</option>
37 <option value="9">Alternative Yeast Nuclear code</option>
38 <option value="10">Ascidian mitochondrial DNA code</option>
39 <option value="11">Flatworm mitochondrial DNA code</option>
40 <option value="12">Blepharisma Nuclear code</option>
41 </param> 34 </param>
42 <param name="grid_points" type="integer" value="20" min="5" max="50" label="Grid points" />
43 <param name="mcmc" type="integer" value="5" min="2" max="20" label="Number of MCMC chains" /> 35 <param name="mcmc" type="integer" value="5" min="2" max="20" label="Number of MCMC chains" />
44 <param name="chain_length" type="integer" value="2000000" min="500000" max="50000000" label="Length of each chain" /> 36 <param name="chain_length" type="integer" value="2000000" min="500000" max="50000000" label="Length of each chain" />
45 <param name="samples" type="integer" value="1000000" min="100000" max="1900000" label="Samples to use for burn-in" /> 37 <param name="samples" type="integer" value="1000000" min="100000" max="1900000" label="Samples to use for burn-in" />
46 <param name="samples_per_chain" type="integer" value="100" min="50" max="1000000" label="Samples to draw from each chain" /> 38 <param name="samples_per_chain" type="integer" value="100" min="50" max="1000000" label="Samples to draw from each chain" />
47 <param name="concentration" type="float" value="0.5" min="0.001" max="1" label="Concentration parameter of the Dirichlet prior" /> 39 <param name="concentration" type="float" value="0.5" min="0.001" max="1" label="Concentration parameter of the Dirichlet prior" />
48 </inputs> 40 </inputs>
49 <outputs> 41 <outputs>
50 <data name="fubar_log" format="txt" /> 42 <data name="fubar_log" format="txt" />
51 <data name="fubar_output" format="json" from_work_dir="fubar_input.fa.FUBAR.json" /> 43 <data name="fubar_output" format="hyphy_json_results" from_work_dir="fubar_input.fa.FUBAR.json" />
52 </outputs> 44 </outputs>
53 <tests> 45 <tests>
54 <test> 46 <test>
55 <param name="input_file" ftype="fasta" value="fubar-in1.fa" /> 47 <param name="input_file" ftype="fasta" value="fubar-in1.fa" />
56 <param name="input_nhx" ftype="nhx" value="fubar-in1.nhx" /> 48 <param name="input_nhx" ftype="nhx" value="fubar-in1.nhx" />
49 <param name="posterior" value="1" />
57 <output name="fubar_output" file="fubar-out1.json" compare="sim_size" /> 50 <output name="fubar_output" file="fubar-out1.json" compare="sim_size" />
58 </test> 51 </test>
59 </tests> 52 </tests>
60 <help> 53 <help>
61 <![CDATA[ 54 <![CDATA[
62 Model-based selection analyses (such as those performed by PAML and HyPhy) can be slow, becoming impractical for large alignments. We present a method to model and detect selection much faster than existing methods and to leverage Bayesian MCMC to robustly account for parameter estimation errors. 55 Model-based selection analyses (such as those performed by PAML and HyPhy) can be slow, becoming impractical for large alignments. We present a method to model and detect selection much faster than existing methods and to leverage Bayesian MCMC to robustly account for parameter estimation errors.
63 56
64 Results: By exploiting some commonly used approximations, FUBAR can perform detection of positive selection under a model that allows rich site-to-site rate variation about 30 to 50 times faster than existing random effects likelihood methods, and 10 to 30 times faster than existing fixed effects likelihood methods. We introduce an ultra-fast MCMC routine that allows a flexible prior specification, with no parametric constraints on the prior shape. Furthermore, our method allows us to visualize Bayesian inference for each site, revealing the model supported by the data. 57 Results: By exploiting some commonly used approximations, FUBAR can perform detection of positive selection under a model that allows rich site-to-site rate variation about 30 to 50 times faster than existing random effects likelihood methods, and 10 to 30 times faster than existing fixed effects likelihood methods. We introduce an ultra-fast MCMC routine that allows a flexible prior specification, with no parametric constraints on the prior shape. Furthermore, our method allows us to visualize Bayesian inference for each site, revealing the model supported by the data.
65 ]]> 58 ]]></help>
66 </help> 59 <expand macro="citations">
67 <expand macro="citations"> 60 <citation type="doi">10.1093/molbev/mst030</citation>
68 <citation type="doi">10.1093/molbev/msu400</citation> 61 </expand>
69 </expand>
70 </tool> 62 </tool>