|
0
|
1 <tool id="ucsc_blat" name="UCSC BLAT Alignment Tool" version="1.0">
|
|
|
2 <description>Rapidly align sequences to the genome</description>
|
|
|
3 <requirements>
|
|
|
4 <requirement type="package" version="1.0">ucsc_tools_340_for_BLAT</requirement>
|
|
|
5 </requirements>
|
|
|
6 <command detect_errors="exit_code"><![CDATA[
|
|
|
7 blat
|
|
|
8 #if $noHead
|
|
|
9 -noHead
|
|
|
10 #end if
|
|
|
11 -q=$query_type
|
|
|
12 -t=$database_type
|
|
|
13 -mask=$mask
|
|
|
14 '${database}'
|
|
|
15 '${query}'
|
|
|
16 '${output}'
|
|
|
17
|
|
|
18 ]]></command>
|
|
|
19 <inputs>
|
|
|
20 <param type="data" name="database" format="fasta" />
|
|
|
21 <param type="data" name="query" format="fasta" />
|
|
|
22 <param type="select" name="database_type" format="text" multiple="false" label="database type" help="Choose your database type, the default is dna">
|
|
|
23 <option value="dna">DNA sequence</option>
|
|
|
24 <option value="prot">protein sequence</option>
|
|
|
25 <option value="dnax">DNA sequence translated in six frames to protein</option>
|
|
|
26 </param>
|
|
|
27 <param type="select" name="query_type" format="text" multiple="false" label="query type" help="Choose your query type, the default is dna">
|
|
|
28 <option value="dna">DNA sequence</option>
|
|
|
29 <option value="rna">RNA sequence</option>
|
|
|
30 <option value="prot">protein sequence</option>
|
|
|
31 <option value="dnax">DNA sequence translated in six frames to protein</option>
|
|
|
32 <option value="rnax">DNA sequence translated in three frames to protein</option>
|
|
|
33 </param>
|
|
|
34 <param name="noHead" type="boolean" value="false" label="Suppresses .psl header (so it's just a tab-separated file)." />
|
|
|
35 <param name="mask" type="select" label="Mask out repeats" help="Alignments won't be started in masked region
|
|
|
36 but may extend through it in nucleotide searches. Masked areas
|
|
|
37 are ignored entirely in protein or translated searches.">
|
|
|
38 <option value="lower">lower - mask out lower-cased sequence</option>
|
|
|
39 <option value="upper">upper - mask out upper-cased sequence</option>
|
|
|
40 <option value="out">out - mask according to database.out RepeatMasker .out file</option>
|
|
|
41 <option value="file.out">file.out - mask database according to RepeatMasker file.out</option>
|
|
|
42 </param>
|
|
|
43 <!--<conditional name="database" format="fasta">
|
|
|
44 <param type="select" name="database_type" format="text" multiple="false" label="database type" help="Choose your database type, the default is dna">
|
|
|
45 <option value="dna">DNA sequence</option>
|
|
|
46 <option value="prot">protein sequence</option>
|
|
|
47 <option value="dnax">DNA sequence translated in six frames to protein</option>
|
|
|
48 </param>
|
|
|
49 <when value="dna">
|
|
|
50 <param type="integer" name="tileSize" value="11" min="1" max="12" label="tileSize" help="Sets the size of match that triggers an alignment. Usually between 8 and 12">tileSize</param>
|
|
|
51 <param name="minMatch" type="integer" value="2" label="Sets the number of tile matches. Usually set from 2 to 4.
|
|
|
52 Default is 2 for nucleotide, 1 for protein.">-minMatch</param>
|
|
|
53 <param name="minIdentity" type="integer" value="90" label="Sets minimum sequence identity (in percent). Default is
|
|
|
54 90 for nucleotide searches, 25 for protein or translated
|
|
|
55 protein searches.">-minIdentity</param>
|
|
|
56
|
|
|
57 </when>
|
|
|
58 <when value="prot">
|
|
|
59 <param type="integer" name="tileSize" value="5" min="1" max="12" label="tileSize" help="Sets the size of match that triggers an alignment. Usually between 8 and 12">tileSize</param>
|
|
|
60 <param name="minMatch" type="integer" value="1" label="Sets the number of tile matches. Usually set from 2 to 4.
|
|
|
61 Default is 2 for nucleotide, 1 for protein.">-minMatch</param>
|
|
|
62 <param name="minIdentity" type="integer" value="25" label="Sets minimum sequence identity (in percent). Default is
|
|
|
63 90 for nucleotide searches, 25 for protein or translated
|
|
|
64 protein searches.">-minIdentity</param>
|
|
|
65 </when>
|
|
|
66 </conditional>
|
|
|
67 <param type="select" name="query_type" format="text" multiple="false" label="query type" help="Choose your query type, the default is dna">
|
|
|
68 <option value="dna">DNA sequence</option>
|
|
|
69 <option value="rna">RNA sequence</option>
|
|
|
70 <option value="prot">protein sequence</option>
|
|
|
71 <option value="dnax">DNA sequence translated in six frames to protein</option>
|
|
|
72 <option value="rnax">DNA sequence translated in three frames to protein</option>
|
|
|
73 </param>
|
|
|
74 <conditional name="settings">
|
|
|
75 <param name="advanced" type="select" multiple="false" label="Specify advanced parameters">
|
|
|
76 <option value="simple" selected="true">No, use program defaults. </option>
|
|
|
77 <option value="advanced">Yes, see full parameter list.</option>
|
|
|
78 </param>
|
|
|
79 <when value="advanced">
|
|
|
80 <param name="mask" type="select" label="Mask out repeats" help="Alignments won't be started in masked region
|
|
|
81 but may extend through it in nucleotide searches. Masked areas
|
|
|
82 are ignored entirely in protein or translated searches.">
|
|
|
83 <option value="lower">lower - mask out lower-cased sequence</option>
|
|
|
84 <option value="upper">upper - mask out upper-cased sequence</option>
|
|
|
85 <option value="out">out - mask according to database.out RepeatMasker .out file</option>
|
|
|
86 <option value="file.out">file.out - mask database according to RepeatMasker file.out</option>
|
|
|
87 </param>
|
|
|
88 <param name="qmask" type="select" label="Mask out repeats in query sequence" help="Similar to -mask above, but
|
|
|
89 for query rather than target sequence.">
|
|
|
90 <option value="lower">lower - mask out lower-cased sequence</option>
|
|
|
91 <option value="upper">upper - mask out upper-cased sequence</option>
|
|
|
92 <option value="out">out - mask according to database.out RepeatMasker .out file</option>
|
|
|
93 <option value="file.out">file.out - mask database according to RepeatMasker file.out</option>
|
|
|
94 </param>
|
|
|
95 <param name="oneOff" type="integer" value="0" label="If set to 1, this allows one mismatch in tile and still triggers an alignment. Default is 0.">-oneOff</param>
|
|
|
96 <param name="minScore" type="integer" value="30" label="Sets minimum score. This is the matches minus the
|
|
|
97 mismatches minus some sort of gap penalty. Default is 30.">-minScore</param>
|
|
|
98 <param name="maxGap" type="integer" value="2" label="Sets the size of maximum gap between tiles in a clump. Usually
|
|
|
99 set from 0 to 3. Default is 2. Only relevent for minMatch > 1.">-maxGap</param>
|
|
|
100 <param name="minRepDivergence" type="integer" value="15" min="0" max="100" label="Minimum percent divergence of repeats to allow
|
|
|
101 them to be unmasked. Default is 15. Only relevant for
|
|
|
102 masking using RepeatMasker .out files.">-minRepDivergence</param>
|
|
|
103 <param name="noHead" type="boolean" value="false" label="Suppresses .psl header (so it's just a tab-separated file)." />
|
|
|
104 <param name="dots" type="integer" value="0" label="Output dot every N sequences to show program's progress." />
|
|
|
105 <param name="trimT" type="boolean" value="false" label="Trim leading poly-T." />
|
|
|
106 <param name="trimHardA" type="boolean" value="false" label="Remove poly-A tail from qSize as well as alignments in
|
|
|
107 psl output." />
|
|
|
108 <param name="fastMap" type="boolean" value="false" label="Run for fast DNA/DNA remapping - not allowing introns,
|
|
|
109 requiring high %ID. Query sizes must not exceed 5000." />
|
|
|
110 <param name="fine" type="boolean" value="false" label="For high-quality mRNAs, look harder for small initial and
|
|
|
111 terminal exons. Not recommended for ESTs." />
|
|
|
112 <param name="out" type="select" label="Output file format">
|
|
|
113 <option value="psl" selected="true">psl - Default. Tab-separated format, no sequence</option>
|
|
|
114 <option value="pslx">pslx - Tab-separated format with sequence</option>
|
|
|
115 <option value="axt">axt - blastz-associated axt format</option>
|
|
|
116 <option value="maf">maf - multiz-associated maf format</option>
|
|
|
117 <option value="sim4">sim4 - similar to sim4 format</option>
|
|
|
118 <option value="wublast">wublast - similar to wublast format</option>
|
|
|
119 <option value="blast">blast - similar to NCBI blast format</option>
|
|
|
120 <option value="blast8">blast8- NCBI blast tabular format</option>
|
|
|
121 <option value="blast9">blast9 - NCBI blast tabular format with comments</option>
|
|
|
122 </param>
|
|
|
123 <param name="maxIntro" type="integer" value="750000" label="Sets maximum intron size. Default is 750000." />
|
|
|
124 <param name="extendThroughN" type="boolean" value="false" label="Allows extension of alignment through large blocks of Ns." />
|
|
|
125 </when>
|
|
|
126 </conditional>-->
|
|
|
127 </inputs>
|
|
|
128 <outputs>
|
|
|
129 <data format="psl" name="output"></data>
|
|
|
130 </outputs>
|
|
|
131 <tests>
|
|
|
132 <test>
|
|
|
133 <param name="database" value="amaVit1.fa" />
|
|
|
134 <param name="query" value="Gallus_gallus_RefSeq.fa" />
|
|
|
135 <param name="database_type" value="dnax" />
|
|
|
136 <param name="query_type" value="rnax" />
|
|
|
137 <param name="noHead" value="true" />
|
|
|
138 <param name="mask" value="lower" />
|
|
|
139 <output name="output" value="amaVit1_Gallus_gallus.psl" />
|
|
|
140 </test>
|
|
|
141 </tests>
|
|
|
142 </tool>
|
|
|
143
|
|
|
144
|
|
|
145
|
|
|
146
|
|
|
147 |