Mercurial > repos > iracooke > protk_proteogenomics
comparison protxml_to_gff.xml @ 0:956bfab63005 draft default tip
planemo upload for repository https://github.com/iracooke/protk-galaxytools/blob/master/protk-proteogenomics/.shed.yml commit 24e0fef2496984648a8a5cd5bff4d6b9b634a302-dirty
author | iracooke |
---|---|
date | Tue, 20 Oct 2015 20:36:03 -0400 |
parents | |
children |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:956bfab63005 |
---|---|
1 <tool id="protxml_to_gff" name="Proteomics to GFF" version="1.1.0"> | |
2 <description>Export Proteomics Data to GFF</description> | |
3 <requirements> | |
4 <container type="docker">iracooke/protk-1.4.3</container> | |
5 <requirement type="package" version="1.4.3">protk</requirement> | |
6 <requirement type="package" version="2.2.29">blast+</requirement> | |
7 </requirements> | |
8 <stdio> | |
9 <exit_code range="1:" level="fatal" description="Failure" /> | |
10 </stdio> | |
11 <command> | |
12 protxml_to_gff.rb $protxml_file | |
13 #if $database.source_select=="built_in": | |
14 -d $database.dbkey | |
15 #else | |
16 -d $database.fasta_file | |
17 #end if | |
18 -c $gene_file | |
19 #if str( $gffidpattern ): | |
20 --gff-idregex='$gffidpattern' | |
21 #end if | |
22 | |
23 #if str( $genomeidpattern ): | |
24 --genome-idregex='$genomeidpattern' | |
25 #end if | |
26 | |
27 #if str( $ignorepattern ): | |
28 --ignore-regex='$ignorepattern' | |
29 #end if | |
30 | |
31 --threshold=$peptide_threshold | |
32 --prot-threshold=$prot_threshold | |
33 $stack_charges | |
34 -o $output | |
35 </command> | |
36 <inputs> | |
37 <conditional name="database"> | |
38 <param name="source_select" type="select" label="Database source used for Proteomics Searches" help="Database should be an amino acid fasta file with entry id's that can be parsed to obtain contig or scaffold ids referenced in your gff file"> | |
39 <option value="input_ref">Your Upload File</option> | |
40 <option value="built_in">Built-In</option> | |
41 </param> | |
42 <when value="built_in"> | |
43 <param name="dbkey" type="select" format="text" > | |
44 <label>Database</label> | |
45 <options from_file="pepxml_databases.loc"> | |
46 <column name="name" index="0" /> | |
47 <column name="value" index="2" /> | |
48 </options> | |
49 </param> | |
50 </when> | |
51 <when value="input_ref"> | |
52 <param name="fasta_file" type="data" format="fasta" label="Uploaded FASTA file" /> | |
53 </when> | |
54 </conditional> | |
55 <param name="protxml_file" type="data" format="protxml" multiple="false" label="Proteomics Search Results" help="A ProtXML file produced by Protein Prophet"/> | |
56 <param name="gene_file" type="data" format="gff3" multiple="false" label="Protein coordinates" help="A gff3 file with coordinates for all protein entries used for proteomics searches. Coordinates should correspond to entries in the genome fasta file"/> | |
57 <param name="peptide_threshold" label="Peptide Probability Threshold" type="float" value="0.95" min="0" max="1" help="Only peptides within accepted proteins and passing this threshold will appear in the output"/> | |
58 <param name="prot_threshold" label="Protein Probability Threshold" type="float" value="0.99" min="0" max="1" help="Only peptides within proteins passing this threshold will appear in the output"/> | |
59 <param name="stack_charges" value="false" type="boolean" label="Peptides with different charges get separate gff entries" help="" truevalue="--stack-charge-states" falsevalue="" /> | |
60 <param name="gffidpattern" size="40" type="text" value="lcl\|([^ ]*)" label="gff id regex" help="Regex with capture group for parsing gff ids from protein ids"> | |
61 <sanitizer> | |
62 <valid initial="string.printable"> | |
63 <remove value="'"/> | |
64 </valid> | |
65 <mapping initial="none"> | |
66 <add source="'" target="__sq__"/> | |
67 </mapping> | |
68 </sanitizer> | |
69 </param> | |
70 | |
71 <param name="genomeidpattern" size="40" type="text" label="genome id regex" help="Regex with capture group for parsing genomic ids from protein ids"> | |
72 <sanitizer> | |
73 <valid initial="string.printable"> | |
74 <remove value="'"/> | |
75 </valid> | |
76 <mapping initial="none"> | |
77 <add source="'" target="__sq__"/> | |
78 </mapping> | |
79 </sanitizer> | |
80 </param> | |
81 | |
82 <param name="ignorepattern" size="40" type="text" label="ignore regex" help="Regex to match protein ids that we should ignore completely"> | |
83 <sanitizer> | |
84 <valid initial="string.printable"> | |
85 <remove value="'"/> | |
86 </valid> | |
87 <mapping initial="none"> | |
88 <add source="'" target="__sq__"/> | |
89 </mapping> | |
90 </sanitizer> | |
91 </param> | |
92 | |
93 | |
94 | |
95 </inputs> | |
96 <outputs> | |
97 <data format="gff3" name="output" /> | |
98 </outputs> | |
99 <tests> | |
100 <test> | |
101 <param name="source_select" value="input_ref"/> | |
102 <param name="fasta_file" value="small_prot.fasta" format="fasta"/> | |
103 | |
104 <param name="protxml_file" value="small.prot.xml" format="protxml"/> | |
105 <param name="gene_file" value="small_combined.gff" format="gff3"/> | |
106 <output name="output" format="gff3"> | |
107 <assert_contents> | |
108 <has_text text="polypeptide" /> | |
109 </assert_contents> | |
110 </output> | |
111 </test> | |
112 </tests> | |
113 <help> | |
114 | |
115 **What it does** | |
116 | |
117 Exports peptides and proteins to gff | |
118 | |
119 </help> | |
120 </tool> |