annotate meme_psp_gen.xml @ 6:73c8585320a9 draft default tip

Uploaded
author greg
date Mon, 21 Aug 2017 10:14:40 -0400
parents e994f439190c
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
1 <tool id="meme_psp_gen" name="MEME psp-gen" version="4.11.2.0">
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
2 <description>- perform discriminative motif discovery</description>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
3 <macros>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
4 <import>macros.xml</import>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
5 </macros>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
6 <expand macro="requirements" />
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
7 <command detect_errors="exit_code"><![CDATA[
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
8 psp-gen
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
9 -pos '$primary_sequence'
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
10 -neg '$control_sequence'
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
11 -minw $adv.minw
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
12 -maxw $adv.maxw
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
13 $adv.alphabet
5
e994f439190c Uploaded
greg
parents: 4
diff changeset
14 #if str($adv.triples_cond.triples) == 'yes':
e994f439190c Uploaded
greg
parents: 4
diff changeset
15 -triples
6
73c8585320a9 Uploaded
greg
parents: 5
diff changeset
16 $adv.triples_cond.fixed_start
5
e994f439190c Uploaded
greg
parents: 4
diff changeset
17 #end if
6
73c8585320a9 Uploaded
greg
parents: 5
diff changeset
18 $adv.equiv
73c8585320a9 Uploaded
greg
parents: 5
diff changeset
19 $adv.consider_both_strands
73c8585320a9 Uploaded
greg
parents: 5
diff changeset
20 $adv.scale_min
73c8585320a9 Uploaded
greg
parents: 5
diff changeset
21 $adv.scale_max
73c8585320a9 Uploaded
greg
parents: 5
diff changeset
22 $adv.max_range
73c8585320a9 Uploaded
greg
parents: 5
diff changeset
23 $adv.raw
5
e994f439190c Uploaded
greg
parents: 4
diff changeset
24 #if str($adv.report_scores_cond.report_scores) == 'yes':
e994f439190c Uploaded
greg
parents: 4
diff changeset
25 -reportscores
6
73c8585320a9 Uploaded
greg
parents: 5
diff changeset
26 $adv.report_scores_cond.verbose
2
c32084cb7fe7 Uploaded
greg
parents: 0
diff changeset
27 2> '$output_tabular'
0
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
28 #end if
2
c32084cb7fe7 Uploaded
greg
parents: 0
diff changeset
29 > '$output_psp'
0
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
30 ]]></command>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
31 <inputs>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
32 <param format="fasta" name="primary_sequence" type="data" label="Primary sequence file"/>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
33 <param format="fasta" name="control_sequence" type="data" label="Control sequence file"/>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
34 <section name="adv" title="Additional Options">
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
35 <param name="minw" type="integer" value="4" min="0" label="Minimum width to use for position specific priors"/>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
36 <param name="maxw" type="integer" value="20" min="0" label="Maximum width to use for position specific priors"/>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
37 <param name="alphabet" type="select" label="Alphabet">
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
38 <option value="-dna" selected="true">DNA</option>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
39 <option value="-protein">protein</option>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
40 <option value="-rna">RNA</option>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
41 </param>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
42 <conditional name="triples_cond">
5
e994f439190c Uploaded
greg
parents: 4
diff changeset
43 <param name="triples" type="select" label="Use spaced triples instead of whole-word matches?" help="Recommended for protein">
e994f439190c Uploaded
greg
parents: 4
diff changeset
44 <option value="no" selected="true">No</option>
e994f439190c Uploaded
greg
parents: 4
diff changeset
45 <option value="yes">yes</option>
e994f439190c Uploaded
greg
parents: 4
diff changeset
46 </param>
0
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
47 <when value="no"/>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
48 <when value="yes">
4
01d22cb1bccc Uploaded
greg
parents: 3
diff changeset
49 <param name="fixed_start" type="boolean" truevalue="-fixedstart" falsevalue="" checked="False" label="Only consider triples starting at the start of a site?" help="Select 'No' to allow triples to start anywhere within a site"/> <!-- 'Yes' emits -fixedstart, which restricts triples to the start of the site; the label and help are worded so that 'Yes' matches the flag that is actually passed. The flag values and default are unchanged. -->
0
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
50 </when>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
51 </conditional>
4
01d22cb1bccc Uploaded
greg
parents: 3
diff changeset
52 <param name="equiv" type="boolean" truevalue="-equiv" falsevalue="" checked="False" label="Match as equal sequences of letters that appear together?"/> <!-- NOTE(review): this boolean emits a bare -equiv, but the help text in this file shows the option taking a letter-group argument (e.g. -equiv "IVL-HKR"). Confirm against the psp-gen usage whether a text input for the groups is required. -->
01d22cb1bccc Uploaded
greg
parents: 3
diff changeset
53 <param name="consider_both_strands" type="boolean" truevalue="-revcomp" falsevalue="" checked="False" label="Consider both strands when calculating position specific priors for alphabets?"/>
01d22cb1bccc Uploaded
greg
parents: 3
diff changeset
54 <param name="scale_min" type="boolean" truevalue="-scalemin" falsevalue="" checked="False" label="Set the lowest score value after scaling?"/> <!-- NOTE(review): this boolean emits a bare -scalemin with no value, while the help text in this file describes a numeric lowest score (default 0.1). Presumably psp-gen expects a number after the flag; confirm against the psp-gen usage. -->
01d22cb1bccc Uploaded
greg
parents: 3
diff changeset
55 <param name="scale_max" type="boolean" truevalue="-scalemax" falsevalue="" checked="False" label="Set the highest score value after scaling?"/> <!-- NOTE(review): this boolean emits a bare -scalemax with no value, while the help text in this file describes a numeric highest score (default 0.9). Presumably psp-gen expects a number after the flag; confirm against the psp-gen usage. -->
01d22cb1bccc Uploaded
greg
parents: 3
diff changeset
56 <param name="max_range" type="boolean" truevalue="-maxrange" falsevalue="" checked="False" label="Choose the width with the biggest difference between minimum and maximum scores before scaling?" help="Select 'No' to choose the width with the biggest maximum score (before scaling)"/>
01d22cb1bccc Uploaded
greg
parents: 3
diff changeset
57 <param name="raw" type="boolean" truevalue="-raw" falsevalue="" checked="False" label="Output scores instead of priors?"/>
0
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
58 <conditional name="report_scores_cond">
5
e994f439190c Uploaded
greg
parents: 4
diff changeset
59 <param name="report_scores" type="select" label="Output primary and control file names, scores and widths?">
e994f439190c Uploaded
greg
parents: 4
diff changeset
60 <option value="no" selected="true">No</option>
e994f439190c Uploaded
greg
parents: 4
diff changeset
61 <option value="yes">yes</option>
e994f439190c Uploaded
greg
parents: 4
diff changeset
62 </param>
0
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
63 <when value="no"/>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
64 <when value="yes">
4
01d22cb1bccc Uploaded
greg
parents: 3
diff changeset
65 <param name="verbose" type="boolean" truevalue="-verbose" falsevalue="" checked="False" label="Report frequency of each score?"/>
0
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
66 </when>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
67 </conditional>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
68 </section>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
69 <param name="non_commercial_use" label="I certify that I am not using this tool for commercial purposes." type="boolean" truevalue="NON_COMMERCIAL_USE" falsevalue="COMMERCIAL_USE" checked="False">
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
70 <validator type="expression" message="This tool is only available for non-commercial use.">value == True</validator>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
71 </param>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
72 </inputs>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
73 <outputs>
2
c32084cb7fe7 Uploaded
greg
parents: 0
diff changeset
74 <data format="memepsp" name="output_psp"/>
c32084cb7fe7 Uploaded
greg
parents: 0
diff changeset
75 <data format="tabular" name="output_tabular" label="${tool.name} (report) on ${on_string}">
3
79df81990900 Uploaded
greg
parents: 2
diff changeset
76 <filter>adv['report_scores_cond']['report_scores'] == 'yes'</filter>
2
c32084cb7fe7 Uploaded
greg
parents: 0
diff changeset
77 </data>
0
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
78 </outputs>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
79 <tests>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
80 <test>
3
79df81990900 Uploaded
greg
parents: 2
diff changeset
81 <param name="primary_sequence" value="meme_psp_protein_input.fasta" ftype="fasta"/>
79df81990900 Uploaded
greg
parents: 2
diff changeset
82 <param name="control_sequence" value="meme_psp_protein_input.fasta" ftype="fasta"/>
79df81990900 Uploaded
greg
parents: 2
diff changeset
83 <param name="alphabet" value="protein"/>
0
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
84 <param name="non_commercial_use" value="True"/>
3
79df81990900 Uploaded
greg
parents: 2
diff changeset
85 <output name="output_psp" file="output.memepsp"/>
0
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
86 </test>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
87 </tests>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
88 <help>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
89
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
90 .. class:: warningmark
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
91
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
92 **WARNING: This tool is only available for non-commercial use. Use for educational, research and non-profit purposes is permitted.
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
93 Before using, be sure to review, agree, and comply with the license.**
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
94
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
95 psp-gen is used to allow MEME to perform discriminative motif discovery—to find motifs overrepresented in one set of sequences compared to in another set.
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
96 It takes two files as input—the sequence file to be input to MEME, (the "primary" file) and a "control" sequence file of sequences believed not to contain
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
97 the same motifs as in the "primary" file. psp-gen creates a file for use by MEME that encapsulates information about probable discriminative motifs. psp-gen
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
98 records its chosen motif width in the file, and MEME is able to adjust the data when it tries different motif widths.
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
99
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
100 .. class:: infomark
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
101
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
102 For detailed information on psp-gen, click here_, or view the license_.
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
103
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
104 .. _here: http://meme-suite.org/doc/psp-gen.html?man_type=web
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
105 .. _license: http://meme-suite.org/doc/copyright.html?man_type=web
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
106
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
107 -----
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
108
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
109 **Required options**
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
110
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
111 * **Primary sequence file** - a file containing FASTA formatted sequences which are to be used as the primary set in PSP calculation.
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
112 * **Control sequence file** - a file containing FASTA formatted sequences which are to be used as the control set in PSP calculation.
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
113
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
114 **Advanced options**
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
115
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
116 * **Minimum width to use for position specific priors** - the minimum width to use when selecting the "best" width for PSPs.
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
117 * **Maximum width to use for position specific priors** - the maximum width to use when selecting the "best" width for PSPs.
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
118 * **Alphabet** - The alphabet to be used, one of DNA, protein or RNA.
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
119 * **Use spaced triples instead of whole-word matches** - use spaced triples instead of whole-word matches (recommended when using the protein alphabet).
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
120
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
121 * **Allow triples to start anywhere within a site** - when using the -triples option, select 'Yes' to only consider triples starting at the start of the site or 'No' to allow triples to start anywhere in a width 'w' site.
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
122
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
123 * **Match as equal sequences of letters that appear together** - select 'Yes' to match as equal any sequence of letters that appear together. Letter groups are separated using "-"; for example, -equiv "IVL-HKR" means treat all occurrences of I, V or L as the same, and all occurrences of H, K or R as the same.
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
124 * **Consider both strands when calculating position specific priors for alphabets** - select 'Yes' to consider both strands when calculating PSPs for complementable alphabets or 'No' to consider only the given strand.
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
125 * **Set the lowest score value after scaling** - select 'Yes' to set the lowest score to 0.1 unless the following "highest score" option is selected, in which case the lowest score is highest score - 1.
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
126 * **Set the highest score value after scaling** - select 'Yes' to set the highest score to 0.9 unless the previous "lowest score" option is selected, in which case the highest score is lowest score + 1.
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
127 * **Choose the width with the biggest difference between minimum and maximum scores before scaling** - select 'Yes' to choose the width with the biggest difference between minimum and maximum scores before scaling, or 'No' to choose the width with the biggest maximum score before scaling.
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
128 * **Output scores instead of priors** - select 'Yes' to output scores instead of position specific priors.
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
129 * **Output primary and control file names, scores and widths** - select 'Yes' to produce an additional tabular output consisting of the primary and control file names, lowest and highest scores and lowest and highest widths.
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
130
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
131 * **Report frequency of each score** - select 'Yes' to include the frequency of each score in the output.
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
132
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
133 </help>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
134 <citations>
4
01d22cb1bccc Uploaded
greg
parents: 3
diff changeset
135 <citation type="doi">10.1186/1471-2105-11-179</citation>
0
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
136 </citations>
e7b8db2b9246 Uploaded
greg
parents:
diff changeset
137 </tool>