Mercurial > repos > iuc > evidencemodeler
comparison evidencemodeler.xml @ 0:92d95470befc draft default tip
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/evidencemodeler commit 982fe890ba21272719fe6f5cb04707c4c91fca0d
| author | iuc |
|---|---|
| date | Sun, 15 Sep 2024 10:12:13 +0000 |
| parents | |
| children |
comparison
equal
deleted
inserted
replaced
| -1:000000000000 | 0:92d95470befc |
|---|---|
| 1 <tool id="evidencemodeler" name="EVidenceModeler" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="21.05"> | |
| 2 <description>combines ab intio gene predictions, protein and transcript alignments into gene structures</description> | |
| 3 <macros> | |
| 4 <import>macros.xml</import> | |
| 5 </macros> | |
| 6 <xrefs> | |
| 7 <xref type="bio.tools">EvidenceModeler</xref> | |
| 8 </xrefs> | |
| 9 <expand macro="requirements"/> | |
| 10 | |
| 11 <command detect_errors="exit_code"><![CDATA[ | |
| 12 | |
| 13 ln -s '$input_genome' ./input_genome.fasta && | |
| 14 ln -s '$input_predictions' ./input_predictions.gff && | |
| 15 ln -s '$input_weights' ./input_weights.txt && | |
| 16 ln -s '$input_proteins' ./input_proteins.gff && | |
| 17 ln -s '$input_transcript' ./input_transcript.gff && | |
| 18 | |
| 19 EVidenceModeler | |
| 20 --sample_id galaxy | |
| 21 --genome './input_genome.fasta' | |
| 22 --gene_predictions './input_predictions.gff' | |
| 23 --weights './input_weights.txt' | |
| 24 --protein_alignments './input_proteins.gff' | |
| 25 --segmentSize $segmentsize | |
| 26 --overlapSize $overlapsize | |
| 27 | |
| 28 #if $input_transcript: | |
| 29 --transcript_alignments './input_transcript.gff' | |
| 30 #end if | |
| 31 | |
| 32 #if $opt.input_repeat: | |
| 33 --repeats '$opt.input_repeat' | |
| 34 #end if | |
| 35 | |
| 36 #if $opt.input_terminalexon: | |
| 37 --terminalExons '$opt.input_terminalexon' | |
| 38 #end if | |
| 39 | |
| 40 --stop_codons $opt.stop_codon | |
| 41 --min_intron_length $opt.min_intron_length | |
| 42 --search_long_introns $opt.search_long_introns | |
| 43 --re_search_intergenic $opt.re_search_intergenic | |
| 44 --terminal_intergenic_re_search $opt.terminal_intergenic_re_search | |
| 45 | |
| 46 ]]></command> | |
| 47 | |
| 48 <inputs> | |
| 49 <param name="input_genome" type="data" format="fasta" label="Genome input"/> | |
| 50 <param name="input_predictions" type="data" format="gff3" label="Gene predictions input"/> | |
| 51 <param name="input_weights" type="data" format="gff3" label="Weights for evidence types file" help="See documentation for formatting: 'Weights' section"/> | |
| 52 <param name="input_proteins" type="data" format="gff3" label="Protein alignments input" help="Optional but recommended"/> | |
| 53 <param name="input_transcript" type="data" optional="true" format="gff3" label="Transcript alignments input" help="Optional but recommended"/> | |
| 54 <param argument="--segmentSize" name="segmentsize" value="100000" type="integer" label="Length of a single sequence" help="This value must be less than 1 MB" /> | |
| 55 <param argument="--overlapSize" name="overlapsize" value="10000" type="integer" label="Length of sequence overlap between segmented sequences" help="The length must be at least equivalent to one or two expected gene lengths" /> | |
| 56 <section name="opt" title="Advanced option" expanded="false"> | |
| 57 <param name="input_repeat" type="data" optional="true" format="gff3" label="Masked genome repeats"/> | |
| 58 <param name="input_terminalexon" type="data" optional="true" format="gff3" label="Additional file of terminal exons to be taken into account" help="From long-orfs PASA"/> | |
| 59 <param name="stop_codon" argument="--stop_codons" type="select" multiple="true" optional="true" label="List of stop codon" help="For Tetrahymena, set TGA"> | |
| 60 <option value="TAA,TGA,TAG" selected="true">TAA,TGA,TAG</option> | |
| 61 <option value="TAA">TAA</option> | |
| 62 <option value="TGA">TGA</option> | |
| 63 <option value="TAG">TAG</option> | |
| 64 </param> | |
| 65 <param argument="--min_intron_length" type="integer" value="20" label="Minimum length for an intron" help="Default 20 bp" /> | |
| 66 <param argument="--search_long_introns" type="select" label="Reexamine long introns" help="Can find nested genes, but also can result in false positives"> | |
| 67 <option value="0" selected="true">Off</option> | |
| 68 <option value="1">On</option> | |
| 69 </param> | |
| 70 <param argument="--re_search_intergenic" type="select" label="Reexamines intergenic regions of minimum length"> | |
| 71 <option value="0" selected="true">Off</option> | |
| 72 <option value="1">On</option> | |
| 73 </param> | |
| 74 <param argument="--terminal_intergenic_re_search" type="select" label="Reexamines intergenic regions of minimum length"> | |
| 75 <option value="0" selected="true">Off</option> | |
| 76 <option value="1">On</option> | |
| 77 </param> | |
| 78 </section> | |
| 79 </inputs> | |
| 80 | |
| 81 <outputs> | |
| 82 <data name='evm_gff' format='gff' label="${tool.name} on ${on_string}: GFF3" from_work_dir="galaxy.EVM.gff3"/> | |
| 83 <data name='evm_pep' format='fasta' label="${tool.name} on ${on_string}: PEP" from_work_dir="galaxy.EVM.pep"/> | |
| 84 </outputs> | |
| 85 | |
| 86 <tests> | |
| 87 <test expect_num_outputs="2"> | |
| 88 <param name="input_genome" value="genome.fasta"/> | |
| 89 <param name="input_predictions" value="gene_predictions.gff3"/> | |
| 90 <param name="input_weights" value="weights.txt"/> | |
| 91 <param name="input_proteins" value="protein_alignments.gff3"/> | |
| 92 <param name="input_transcript" value="transcript_alignments.gff3"/> | |
| 93 <param name="segmentsize" value="100000"/> | |
| 94 <param name="overlapsize" value="10000"/> | |
| 95 <conditional name="opt"> | |
| 96 <param name="adv" value="true"/> | |
| 97 <param name="min_intron_length" value="20"/> | |
| 98 <param name="search_long_introns" value="0"/> | |
| 99 <param name="re_search_intergenic" value="0"/> | |
| 100 <param name="terminal_intergenic_re_search" value="0"/> | |
| 101 </conditional> | |
| 102 <output name="evm_pep" ftype="fasta"> | |
| 103 <assert_contents> | |
| 104 <has_text text="evm.model.Contig1.3 evm.TU.Contig1.3 EVM prediction Contig1.3 Contig1:7611-9749(-)"/> | |
| 105 <has_text text="evm.model.Contig1.10 evm.TU.Contig1.10 EVM prediction Contig1.10 Contig1:57371-59941(+)"/> | |
| 106 <has_n_lines n="108" delta="0"/> | |
| 107 <has_n_columns n="1" delta="0"/> | |
| 108 </assert_contents> | |
| 109 </output> | |
| 110 <output name="evm_gff" ftype="gff"> | |
| 111 <assert_contents> | |
| 112 <has_text text="ID=evm.TU.Contig1.1;Name=EVM%20prediction%20Contig1.1"/> | |
| 113 <has_text text="ID=evm.TU.Contig1.4;Name=EVM%20prediction%20Contig1.4"/> | |
| 114 <has_n_lines n="191" delta="0"/> | |
| 115 <has_n_columns n="9" delta="0"/> | |
| 116 <!-- the sep=";" is used to count the gff properties --> | |
| 117 <has_n_columns n="2" delta="0" sep=";"/> | |
| 118 </assert_contents> | |
| 119 </output> | |
| 120 </test> | |
| 121 </tests> | |
| 122 | |
| 123 <help><![CDATA[ | |
| 124 EvidenceModeler_: EVidenceModeler (aka EVM) is a software package that combines ab intio | |
| 125 gene predictions and protein and transcript alignments into weighted consensus gene structures. | |
| 126 EVM provides a flexible and intuitive framework for combining various types of evidence into a | |
| 127 single automated gene structure annotation system. | |
| 128 | |
| 129 .. _EvidenceModeler: https://github.com/EVidenceModeler/EVidenceModeler.github.io | |
| 130 ]]></help> | |
| 131 <expand macro="citation"></expand> | |
| 132 </tool> |
