|
0
|
1 <tool id="meme_psp_gen" name="MEME psp-gen" version="4.11.2.0">
|
|
|
2 <description>- perform discriminative motif discovery</description>
|
|
|
3 <macros>
|
|
|
4 <import>macros.xml</import>
|
|
|
5 </macros>
|
|
|
6 <expand macro="requirements" />
|
|
|
7 <command detect_errors="exit_code"><![CDATA[
|
|
|
8 psp-gen
|
|
|
9 -pos '$primary_sequence'
|
|
|
10 -neg '$control_sequence'
|
|
|
11 -minw $adv.minw
|
|
|
12 -maxw $adv.maxw
|
|
|
13 $adv.alphabet
|
|
5
|
14 #if str($adv.triples_cond.triples) == 'yes':
|
|
|
15 -triples
|
|
6
|
16 $adv.triples_cond.fixed_start
|
|
5
|
17 #end if
|
|
6
|
18 $adv.equiv
|
|
|
19 $adv.consider_both_strands
|
|
|
20 $adv.scale_min
|
|
|
21 $adv.scale_max
|
|
|
22 $adv.max_range
|
|
|
23 $adv.raw
|
|
5
|
24 #if str($adv.report_scores_cond.report_scores) == 'yes':
|
|
|
25 -reportscores
|
|
6
|
26 $adv.report_scores_cond.verbose
|
|
2
|
27 2> '$output_tabular'
|
|
0
|
28 #end if
|
|
2
|
29 > '$output_psp'
|
|
0
|
30 ]]></command>
|
|
|
31 <inputs>
|
|
|
32 <param format="fasta" name="primary_sequence" type="data" label="Primary sequence file"/>
|
|
|
33 <param format="fasta" name="control_sequence" type="data" label="Control sequence file"/>
|
|
|
34 <section name="adv" title="Additional Options">
|
|
|
35 <param name="minw" type="integer" value="4" min="0" label="Minimum width to use for position specific priors"/>
|
|
|
36 <param name="maxw" type="integer" value="20" min="0" label="Maximum width to use for position specific priors"/>
|
|
|
37 <param name="alphabet" type="select" label="Alphabet">
|
|
|
38 <option value="-dna" selected="true">DNA</option>
|
|
|
39 <option value="-protein">protein</option>
|
|
|
40 <option value="-rna">RNA</option>
|
|
|
41 </param>
|
|
|
42 <conditional name="triples_cond">
|
|
5
|
43 <param name="triples" type="select" label="Use spaced triples instead of whole-word matches?" help="Recommended for protein">
|
|
|
44 <option value="no" selected="true">No</option>
|
|
|
45 <option value="yes">yes</option>
|
|
|
46 </param>
|
|
0
|
47 <when value="no"/>
|
|
|
48 <when value="yes">
|
|
4
|
49 <param name="fixed_start" type="boolean" truevalue="-fixedstart" falsevalue="" checked="False" label="Allow triples to start anywhere within a site?" help="Select 'No' to only consider triples starting at the start of the site"/>
|
|
0
|
50 </when>
|
|
|
51 </conditional>
|
|
4
|
52 <param name="equiv" type="boolean" truevalue="-equiv" falsevalue="" checked="False" label="Match as equal sequences of letters that appear together?"/>
|
|
|
53 <param name="consider_both_strands" type="boolean" truevalue="-revcomp" falsevalue="" checked="False" label="Consider both strands when calculating position specific priors for alphabets?"/>
|
|
|
54 <param name="scale_min" type="boolean" truevalue="-scalemin" falsevalue="" checked="False" label="Set the lowest score value after scaling?"/>
|
|
|
55 <param name="scale_max" type="boolean" truevalue="-scalemax" falsevalue="" checked="False" label="Set the highest score value after scaling?"/>
|
|
|
56 <param name="max_range" type="boolean" truevalue="-maxrange" falsevalue="" checked="False" label="Choose the width with the biggest difference between minimum and maximum scores before scaling?" help="Select 'No' to choose the width with the biggest maximum score (before scaling)"/>
|
|
|
57 <param name="raw" type="boolean" truevalue="-raw" falsevalue="" checked="False" label="Output scores instead of priors?"/>
|
|
0
|
58 <conditional name="report_scores_cond">
|
|
5
|
59 <param name="report_scores" type="select" label="Output primary and control file names, scores and widths?">
|
|
|
60 <option value="no" selected="true">No</option>
|
|
|
61 <option value="yes">yes</option>
|
|
|
62 </param>
|
|
0
|
63 <when value="no"/>
|
|
|
64 <when value="yes">
|
|
4
|
65 <param name="verbose" type="boolean" truevalue="-verbose" falsevalue="" checked="False" label="Report frequency of each score?"/>
|
|
0
|
66 </when>
|
|
|
67 </conditional>
|
|
|
68 </section>
|
|
|
69 <param name="non_commercial_use" label="I certify that I am not using this tool for commercial purposes." type="boolean" truevalue="NON_COMMERCIAL_USE" falsevalue="COMMERCIAL_USE" checked="False">
|
|
|
70 <validator type="expression" message="This tool is only available for non-commercial use.">value == True</validator>
|
|
|
71 </param>
|
|
|
72 </inputs>
|
|
|
73 <outputs>
|
|
2
|
74 <data format="memepsp" name="output_psp"/>
|
|
|
75 <data format="tabular" name="output_tabular" label="${tool.name} (report) on ${on_string}">
|
|
3
|
76 <filter>adv['report_scores_cond']['report_scores'] == 'yes'</filter>
|
|
2
|
77 </data>
|
|
0
|
78 </outputs>
|
|
|
79 <tests>
|
|
|
80 <test>
|
|
3
|
81 <param name="primary_sequence" value="meme_psp_protein_input.fasta" ftype="fasta"/>
|
|
|
82 <param name="control_sequence" value="meme_psp_protein_input.fasta" ftype="fasta"/>
|
|
|
83 <param name="alphabet" value="protein"/>
|
|
0
|
84 <param name="non_commercial_use" value="True"/>
|
|
3
|
85 <output name="output_psp" file="output.memepsp"/>
|
|
0
|
86 </test>
|
|
|
87 </tests>
|
|
|
88 <help>
|
|
|
89
|
|
|
90 .. class:: warningmark
|
|
|
91
|
|
|
92 **WARNING: This tool is only available for non-commercial use. Use for educational, research and non-profit purposes is permitted.
|
|
|
93 Before using, be sure to review, agree, and comply with the license.**
|
|
|
94
|
|
|
95 psp-gen is used to allow MEME to perform discriminative motif discovery—to find motifs overrepresented in one set of sequences compared to in another set.
|
|
|
96 It takes two files as input—the sequence file to be input to MEME, (the "primary" file) and a "control" sequence file of sequences believed not to contain
|
|
|
97 the same motifs as in the "primary" file. psp-gen creates a file for use by MEME that encapsulates information about probable discriminative motifs. psp-gen
|
|
|
98 records its chosen motif width in the file, and MEME is able to adjust the data when it tries different motif widths.
|
|
|
99
|
|
|
100 .. class:: infomark
|
|
|
101
|
|
|
102 For detailed information on psp-gen, click here_, or view the license_.
|
|
|
103
|
|
|
104 .. _here: http://meme-suite.org/doc/psp-gen.html?man_type=web
|
|
|
105 .. _license: http://meme-suite.org/doc/copyright.html?man_type=web
|
|
|
106
|
|
|
107 -----
|
|
|
108
|
|
|
109 **Required options**
|
|
|
110
|
|
|
111 * **Primary sequence file** - a file containing FASTA formatted sequences which are to be used as the primary set in PSP calculation.
|
|
|
112 * **Control sequence file** - a file containing FASTA formatted sequences which are to be used as the control set in PSP calculation.
|
|
|
113
|
|
|
114 **Advanced options**
|
|
|
115
|
|
|
116 * **Minimum width to use for position specific priors** - the minimum width to use with selecting the "best" width for PSPs.
|
|
|
117 * **Maximum width to use for position specific priors** - the maximum width to use with selecting the "best" width for PSPs.
|
|
|
118 * **Alphabet** - The alphabet to be used, one of DNA, protein or RNA.
|
|
|
119 * **Use spaced triples instead of whole-word matches** - use spaced triples instead of whole-word matches (recommended when using the protein alphabet).
|
|
|
120
|
|
|
121 * **Allow triples to start anywhere within a site** - when using the -triples option, select 'Yes' to only consider triples starting at the start of the site or 'No' to allow triples to start anywhere in a width 'w' site.
|
|
|
122
|
|
|
123 * **Match as equal sequences of letters that appear together** - select 'Yes' to match as equal any sequence of letter that appears together. Separate letter groups using "-" (e.g. -equiv "IVL-HKR") means treat all occurrences of I, V or L as the same, and all occurrences of H, K or R as the same.
|
|
|
124 * **Consider both strands when calculating position specific priors for alphabets** - select 'Yes' to consider both strands when calculating PSPs for complementable alphabets or 'No to consider only the given strand.
|
|
|
125 * **Set the lowest score value after scaling** - select 'Yes' to set the lowest score to 0.1 unless the the following "highest score" option is selected, in which case the lowest score is highest score - 1.
|
|
|
126 * **Set the highest score value after scaling** - select 'Yes' to set the highest score to 0.9 unless the previous "lowest score" option is selected, in which case the highest score is lowest score + 1.
|
|
|
127 * **Choose the width with the biggest difference between minimum and maximum scores before scaling** - select 'Yes' to choose the width with the biggest difference between minimum and maximum scores before scaling, or 'No' to choose the width with the biggest maximum score before scaling.
|
|
|
128 * **Output scores instead of priors** - select 'Yes' to output scores instead of position specific priors.
|
|
|
129 * **Output primary and control file names, scores and widths** - select 'Yes' to produce an additional tabular output consisting of control file names, lowest and highest scores and lowest and highest widths.
|
|
|
130
|
|
|
131 * **Report frequency of each score** - select 'Yes' to include the frequency of each score in the output.
|
|
|
132
|
|
|
133 </help>
|
|
|
134 <citations>
|
|
4
|
135 <citation type="doi">10.1186/1471-2105-11-179</citation>
|
|
0
|
136 </citations>
|
|
|
137 </tool>
|