annotate gene_family_classifier.xml @ 47:4a6834056e1e draft

Uploaded
author greg
date Tue, 07 Feb 2017 14:24:32 -0500
parents 6c3fa9907d9c
children 906d5277042c
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
28
a63b610ec5bd Uploaded
greg
parents: 27
diff changeset
1 <tool id="plant_tribes_gene_family_classifier" name="Classify gene sequences" version="0.3">
a63b610ec5bd Uploaded
greg
parents: 27
diff changeset
2 <description>into precomputed orthologous gene family clusters</description>
0
315440c6fb44 Uploaded
greg
parents:
diff changeset
3 <requirements>
28
a63b610ec5bd Uploaded
greg
parents: 27
diff changeset
4 <requirement type="package" version="0.3">plant_tribes_gene_family_classifier</requirement>
0
315440c6fb44 Uploaded
greg
parents:
diff changeset
5 </requirements>
315440c6fb44 Uploaded
greg
parents:
diff changeset
6 <stdio>
315440c6fb44 Uploaded
greg
parents:
diff changeset
7 <!-- Anything other than zero is an error -->
315440c6fb44 Uploaded
greg
parents:
diff changeset
8 <exit_code range="1:" />
29
59d1ec149c64 Uploaded
greg
parents: 28
diff changeset
9 <exit_code range=":-1" />
59d1ec149c64 Uploaded
greg
parents: 28
diff changeset
10 <!-- In case the return code has not been set properly, check stderr too -->
0
315440c6fb44 Uploaded
greg
parents:
diff changeset
11 <regex match="Error:" />
315440c6fb44 Uploaded
greg
parents:
diff changeset
12 <regex match="Exception:" />
315440c6fb44 Uploaded
greg
parents:
diff changeset
13 </stdio>
315440c6fb44 Uploaded
greg
parents:
diff changeset
14 <command>
315440c6fb44 Uploaded
greg
parents:
diff changeset
15 <![CDATA[
39
c4f809cd2f38 Uploaded
greg
parents: 38
diff changeset
16 #import os
c4f809cd2f38 Uploaded
greg
parents: 38
diff changeset
17 #set scaffold_path = $scaffold.fields.path
c4f809cd2f38 Uploaded
greg
parents: 38
diff changeset
18 #set scaffold_dir = $os.path.split($scaffold_path)[0]
c4f809cd2f38 Uploaded
greg
parents: 38
diff changeset
19 #set scaffold_selection = $os.path.split($scaffold_path)[1]
35
0fc60c5cb719 Uploaded
greg
parents: 34
diff changeset
20
21
795745116516 Uploaded
greg
parents: 20
diff changeset
21 #if str($options_type.options_type_selector) == 'advanced':
17
cb7487bdab99 Uploaded
greg
parents: 16
diff changeset
22 #set create_orthogroup_cond = $options_type.create_orthogroup_cond
cb7487bdab99 Uploaded
greg
parents: 16
diff changeset
23 #set create_orthogroup = $create_orthogroup_cond.create_orthogroup
44
46f43a90492a Uploaded
greg
parents: 43
diff changeset
24 #set specify_single_copy_cond = $options_type.specify_single_copy_cond
46
6c3fa9907d9c Uploaded
greg
parents: 45
diff changeset
25 #set specify_single_copy = $specify_single_copy_cond.specify_single_copy
44
46f43a90492a Uploaded
greg
parents: 43
diff changeset
26
46f43a90492a Uploaded
greg
parents: 43
diff changeset
27 #if str($specify_single_copy) == 'yes':
47
4a6834056e1e Uploaded
greg
parents: 46
diff changeset
28 #set single_copy_orthogroup = True
44
46f43a90492a Uploaded
greg
parents: 43
diff changeset
29 #set single_copy_fasta_src_dir = $os.path.join('geneFamilyClassification_dir', 'single_copy_fasta')
46f43a90492a Uploaded
greg
parents: 43
diff changeset
30 #set single_copy_fasta_dest_dir = $output_ptsco.extra_files_path
46f43a90492a Uploaded
greg
parents: 43
diff changeset
31 #set single_copy_cond = $specify_single_copy_cond.single_copy_cond
46f43a90492a Uploaded
greg
parents: 43
diff changeset
32 ## FixMe: the single_copy_custom option is not currently supported.
46f43a90492a Uploaded
greg
parents: 43
diff changeset
33 #set single_copy = $single_copy_cond.single_copy
46f43a90492a Uploaded
greg
parents: 43
diff changeset
34 mkdir -p $single_copy_fasta_dest_dir &&
46f43a90492a Uploaded
greg
parents: 43
diff changeset
35 #else:
47
4a6834056e1e Uploaded
greg
parents: 46
diff changeset
36 #set single_copy_orthogroup = False
44
46f43a90492a Uploaded
greg
parents: 43
diff changeset
37 #end if
22
035e8b85cdf7 Uploaded
greg
parents: 21
diff changeset
38
21
795745116516 Uploaded
greg
parents: 20
diff changeset
39 #if str($create_orthogroup) == 'yes':
44
46f43a90492a Uploaded
greg
parents: 43
diff changeset
40 #set create_ortho_sequences = True
46f43a90492a Uploaded
greg
parents: 43
diff changeset
41 #set orthogroups_fasta_src_dir = $os.path.join('geneFamilyClassification_dir', 'orthogroups_fasta')
21
795745116516 Uploaded
greg
parents: 20
diff changeset
42 #set create_corresponding_coding_sequences_cond = $create_orthogroup_cond.create_corresponding_coding_sequences_cond
44
46f43a90492a Uploaded
greg
parents: 43
diff changeset
43
21
795745116516 Uploaded
greg
parents: 20
diff changeset
44 #if str($create_corresponding_coding_sequences_cond.create_corresponding_coding_sequences) == 'yes':
795745116516 Uploaded
greg
parents: 20
diff changeset
45 #set create_corresponding_coding_sequences = True
45
916fb0014f89 Uploaded
greg
parents: 44
diff changeset
46 #set orthogroups_fasta_dest_dir = $output_ptcgfcs.extra_files_path
21
795745116516 Uploaded
greg
parents: 20
diff changeset
47 #else:
795745116516 Uploaded
greg
parents: 20
diff changeset
48 #set create_corresponding_coding_sequences = False
44
46f43a90492a Uploaded
greg
parents: 43
diff changeset
49 #set orthogroups_fasta_dest_dir = $output_ptcgf.extra_files_path
46f43a90492a Uploaded
greg
parents: 43
diff changeset
50 #end if
46f43a90492a Uploaded
greg
parents: 43
diff changeset
51 mkdir -p $orthogroups_fasta_dest_dir &&
21
795745116516 Uploaded
greg
parents: 20
diff changeset
52 #else:
795745116516 Uploaded
greg
parents: 20
diff changeset
53 #set create_ortho_sequences = False
23
1d3e9e154750 Uploaded
greg
parents: 22
diff changeset
54 #set create_corresponding_coding_sequences = False
21
795745116516 Uploaded
greg
parents: 20
diff changeset
55 #end if
13
cddbb2f13c28 Uploaded
greg
parents: 12
diff changeset
56 #else:
47
4a6834056e1e Uploaded
greg
parents: 46
diff changeset
57 #set single_copy_orthogroup = False
13
cddbb2f13c28 Uploaded
greg
parents: 12
diff changeset
58 #set create_ortho_sequences = False
23
1d3e9e154750 Uploaded
greg
parents: 22
diff changeset
59 #set create_corresponding_coding_sequences = False
4
2ffac03c08fe Uploaded
greg
parents: 3
diff changeset
60 #end if
20
038777896b71 Uploaded
greg
parents: 19
diff changeset
61
0
315440c6fb44 Uploaded
greg
parents:
diff changeset
62 GeneFamilyClassifier
35
0fc60c5cb719 Uploaded
greg
parents: 34
diff changeset
63 --proteins '$input'
0fc60c5cb719 Uploaded
greg
parents: 34
diff changeset
64 --scaffold_dir '$scaffold_dir'
0fc60c5cb719 Uploaded
greg
parents: 34
diff changeset
65 --scaffold '$scaffold_selection'
0
315440c6fb44 Uploaded
greg
parents:
diff changeset
66 --method $method
13
cddbb2f13c28 Uploaded
greg
parents: 12
diff changeset
67 --classifier $save_hmmscan_log_cond.classifier
30
e9d9632762ca Uploaded
greg
parents: 29
diff changeset
68 --num_threads \${GALAXY_SLOTS:-4}
20
038777896b71 Uploaded
greg
parents: 19
diff changeset
69
0
315440c6fb44 Uploaded
greg
parents:
diff changeset
70 #if str($options_type.options_type_selector) == 'advanced':
315440c6fb44 Uploaded
greg
parents:
diff changeset
71 --super_orthogroups $options_type.super_orthogroups
47
4a6834056e1e Uploaded
greg
parents: 46
diff changeset
72 #if $single_copy_orthogroup:
44
46f43a90492a Uploaded
greg
parents: 43
diff changeset
73 --single_copy_taxa $single_copy_cond.single_copy_taxa
46f43a90492a Uploaded
greg
parents: 43
diff changeset
74 --taxa_present $single_copy_cond.taxa_present
0
315440c6fb44 Uploaded
greg
parents:
diff changeset
75 #end if
17
cb7487bdab99 Uploaded
greg
parents: 16
diff changeset
76 #if str($create_orthogroup) == 'yes':
0
315440c6fb44 Uploaded
greg
parents:
diff changeset
77 --orthogroup_fasta
18
b14a129fe55f Uploaded
greg
parents: 17
diff changeset
78 #if $create_corresponding_coding_sequences:
35
0fc60c5cb719 Uploaded
greg
parents: 34
diff changeset
79 --coding_sequences '$create_corresponding_coding_sequences_cond.coding_sequences'
17
cb7487bdab99 Uploaded
greg
parents: 16
diff changeset
80 #end if
0
315440c6fb44 Uploaded
greg
parents:
diff changeset
81 #end if
315440c6fb44 Uploaded
greg
parents:
diff changeset
82 #end if
44
46f43a90492a Uploaded
greg
parents: 43
diff changeset
83 >/dev/null
20
038777896b71 Uploaded
greg
parents: 19
diff changeset
84
13
cddbb2f13c28 Uploaded
greg
parents: 12
diff changeset
85 #if str($save_hmmscan_log_cond.classifier) == 'hmmscan' or str($save_hmmscan_log_cond.classifier) == 'both':
cddbb2f13c28 Uploaded
greg
parents: 12
diff changeset
86 #if str($save_hmmscan_log_cond.save_hmmscan_log) == 'yes':
15
9d4ec1102803 Uploaded
greg
parents: 14
diff changeset
87 && mv geneFamilyClassification_dir/hmmscan.log $hmmscan_log
13
cddbb2f13c28 Uploaded
greg
parents: 12
diff changeset
88 #else:
15
9d4ec1102803 Uploaded
greg
parents: 14
diff changeset
89 && rm geneFamilyClassification_dir/hmmscan.log
13
cddbb2f13c28 Uploaded
greg
parents: 12
diff changeset
90 #end if
12
b75510484c16 Uploaded
greg
parents: 11
diff changeset
91 #end if
20
038777896b71 Uploaded
greg
parents: 19
diff changeset
92
14
595088cc480a Uploaded
greg
parents: 13
diff changeset
93 #if $create_ortho_sequences:
18
b14a129fe55f Uploaded
greg
parents: 17
diff changeset
94 #if $create_corresponding_coding_sequences:
45
916fb0014f89 Uploaded
greg
parents: 44
diff changeset
95 && ls -l $orthogroups_fasta_src_dir | grep f | awk -F ' ' '{print $5"\t"$9}' > $output_ptcgfcs
18
b14a129fe55f Uploaded
greg
parents: 17
diff changeset
96 #else:
45
916fb0014f89 Uploaded
greg
parents: 44
diff changeset
97 && ls -l $orthogroups_fasta_src_dir | grep f | awk -F ' ' '{print $5"\t"$9}' > $output_ptcgf
18
b14a129fe55f Uploaded
greg
parents: 17
diff changeset
98 #end if
44
46f43a90492a Uploaded
greg
parents: 43
diff changeset
99 && mv $orthogroups_fasta_src_dir/* $orthogroups_fasta_dest_dir || true
4
2ffac03c08fe Uploaded
greg
parents: 3
diff changeset
100 #end if
20
038777896b71 Uploaded
greg
parents: 19
diff changeset
101
47
4a6834056e1e Uploaded
greg
parents: 46
diff changeset
102 #if $single_copy_orthogroup:
45
916fb0014f89 Uploaded
greg
parents: 44
diff changeset
103 && ls -l $single_copy_fasta_src_dir | grep f | awk -F ' ' '{print $5"\t"$9}' > $output_ptsco
44
46f43a90492a Uploaded
greg
parents: 43
diff changeset
104 && mv $single_copy_fasta_src_dir/* $single_copy_fasta_dest_dir || true
46f43a90492a Uploaded
greg
parents: 43
diff changeset
105 #end if
0
315440c6fb44 Uploaded
greg
parents:
diff changeset
106 ]]>
315440c6fb44 Uploaded
greg
parents:
diff changeset
107 </command>
315440c6fb44 Uploaded
greg
parents:
diff changeset
108 <inputs>
315440c6fb44 Uploaded
greg
parents:
diff changeset
109 <param name="input" format="fasta" type="data" label="Amino acids (proteins) sequences fasta file"/>
315440c6fb44 Uploaded
greg
parents:
diff changeset
110 <param name="scaffold" type="select" label="Orthogroups or gene families proteins scaffold">
315440c6fb44 Uploaded
greg
parents:
diff changeset
111 <options from_data_table="plant_tribes_scaffolds" />
39
c4f809cd2f38 Uploaded
greg
parents: 38
diff changeset
112 <validator type="no_options" message="No PlantTribes scaffolds are available. Use the PlantTribes Scaffolds Download Data Manager tool in Galaxy to install and populate the PlantTribes scaffolds data table."/>
0
315440c6fb44 Uploaded
greg
parents:
diff changeset
113 </param>
315440c6fb44 Uploaded
greg
parents:
diff changeset
114 <param name="method" type="select" label="Protein clustering method">
315440c6fb44 Uploaded
greg
parents:
diff changeset
115 <option value="gfam" selected="true">GFam</option>
315440c6fb44 Uploaded
greg
parents:
diff changeset
116 <option value="orthofinder">OrthoFinder</option>
315440c6fb44 Uploaded
greg
parents:
diff changeset
117 <option value="orthomcl">OrthoMCL</option>
315440c6fb44 Uploaded
greg
parents:
diff changeset
118 </param>
13
cddbb2f13c28 Uploaded
greg
parents: 12
diff changeset
119 <conditional name="save_hmmscan_log_cond">
cddbb2f13c28 Uploaded
greg
parents: 12
diff changeset
120 <param name="classifier" type="select" label="Protein classification method">
cddbb2f13c28 Uploaded
greg
parents: 12
diff changeset
121 <option value="blastp" selected="true">blastp</option>
cddbb2f13c28 Uploaded
greg
parents: 12
diff changeset
122 <option value="hmmscan">HMMScan</option>
cddbb2f13c28 Uploaded
greg
parents: 12
diff changeset
123 <option value="both">Both blastp and HMMScan</option>
cddbb2f13c28 Uploaded
greg
parents: 12
diff changeset
124 </param>
cddbb2f13c28 Uploaded
greg
parents: 12
diff changeset
125 <when value="blastp" />
cddbb2f13c28 Uploaded
greg
parents: 12
diff changeset
126 <when value="hmmscan">
cddbb2f13c28 Uploaded
greg
parents: 12
diff changeset
127 <param name="save_hmmscan_log" type="select" label="Save hmmscan log?" help="Save the hmmscan log in an additional output dataset">
cddbb2f13c28 Uploaded
greg
parents: 12
diff changeset
128 <option value="no" selected="true">No</option>
cddbb2f13c28 Uploaded
greg
parents: 12
diff changeset
129 <option value="yes">Yes</option>
cddbb2f13c28 Uploaded
greg
parents: 12
diff changeset
130 </param>
cddbb2f13c28 Uploaded
greg
parents: 12
diff changeset
131 </when>
cddbb2f13c28 Uploaded
greg
parents: 12
diff changeset
132 <when value="both">
cddbb2f13c28 Uploaded
greg
parents: 12
diff changeset
133 <param name="save_hmmscan_log" type="select" label="Save hmmscan log?" help="Save the hmmscan log in an additional output dataset">
cddbb2f13c28 Uploaded
greg
parents: 12
diff changeset
134 <option value="no" selected="true">No</option>
cddbb2f13c28 Uploaded
greg
parents: 12
diff changeset
135 <option value="yes">Yes</option>
cddbb2f13c28 Uploaded
greg
parents: 12
diff changeset
136 </param>
cddbb2f13c28 Uploaded
greg
parents: 12
diff changeset
137 </when>
cddbb2f13c28 Uploaded
greg
parents: 12
diff changeset
138 </conditional>
0
315440c6fb44 Uploaded
greg
parents:
diff changeset
139 <conditional name="options_type">
315440c6fb44 Uploaded
greg
parents:
diff changeset
140 <param name="options_type_selector" type="select" label="Options Configuration">
315440c6fb44 Uploaded
greg
parents:
diff changeset
141 <option value="basic" selected="true">Basic</option>
315440c6fb44 Uploaded
greg
parents:
diff changeset
142 <option value="advanced">Advanced</option>
315440c6fb44 Uploaded
greg
parents:
diff changeset
143 </param>
315440c6fb44 Uploaded
greg
parents:
diff changeset
144 <when value="basic" />
315440c6fb44 Uploaded
greg
parents:
diff changeset
145 <when value="advanced">
28
a63b610ec5bd Uploaded
greg
parents: 27
diff changeset
146 <param name="super_orthogroups" type="select" label="Super Orthogroups" help="Secondary MCL clusters of orthogroups">
0
315440c6fb44 Uploaded
greg
parents:
diff changeset
147 <option value="min_evalue" selected="true">Minimum e-value</option>
315440c6fb44 Uploaded
greg
parents:
diff changeset
148 <option value="avg_evalue">Average e-value</option>
315440c6fb44 Uploaded
greg
parents:
diff changeset
149 </param>
44
46f43a90492a Uploaded
greg
parents: 43
diff changeset
150 <conditional name="specify_single_copy_cond">
46f43a90492a Uploaded
greg
parents: 43
diff changeset
151 <param name="specify_single_copy" type="select" label="Specify single copy orthogroup selection?">
46f43a90492a Uploaded
greg
parents: 43
diff changeset
152 <option value="no" selected="true">No</option>
46f43a90492a Uploaded
greg
parents: 43
diff changeset
153 <option value="yes">Yes</option>
0
315440c6fb44 Uploaded
greg
parents:
diff changeset
154 </param>
44
46f43a90492a Uploaded
greg
parents: 43
diff changeset
155 <when value="no"/>
46f43a90492a Uploaded
greg
parents: 43
diff changeset
156 <when value="yes">
46f43a90492a Uploaded
greg
parents: 43
diff changeset
157 <conditional name="single_copy_cond">
46f43a90492a Uploaded
greg
parents: 43
diff changeset
158 <param name="single_copy" type="select" label="Select single copy configuration">
46f43a90492a Uploaded
greg
parents: 43
diff changeset
159 <!--
46f43a90492a Uploaded
greg
parents: 43
diff changeset
160 FixMe: single_copy_custom is not currently supported because the
46f43a90492a Uploaded
greg
parents: 43
diff changeset
161 ~/config/*.singleCopy.config files are not easy to manage by a user
46f43a90492a Uploaded
greg
parents: 43
diff changeset
162 and the GeneFamilyClassifier pipeline must be enhanced to provide an
46f43a90492a Uploaded
greg
parents: 43
diff changeset
163 optional parameter for the hard-coded path to the config.
46f43a90492a Uploaded
greg
parents: 43
diff changeset
164 <option value="custom" selected="true">Single copy orthogroup custom</option>
46f43a90492a Uploaded
greg
parents: 43
diff changeset
165 -->
46f43a90492a Uploaded
greg
parents: 43
diff changeset
166 <option value="taxa">Minumum single copy taxa required in orthogroup</option>
46f43a90492a Uploaded
greg
parents: 43
diff changeset
167 </param>
46f43a90492a Uploaded
greg
parents: 43
diff changeset
168 <when value="custom" />
46f43a90492a Uploaded
greg
parents: 43
diff changeset
169 <when value="taxa">
46f43a90492a Uploaded
greg
parents: 43
diff changeset
170 <param name="single_copy_taxa" type="integer" value="20" label="Minumum single copy taxa required in orthogroup"/>
46f43a90492a Uploaded
greg
parents: 43
diff changeset
171 <param name="taxa_present" type="integer" value="21" label="Minumum taxa required in single copy orthogroup"/>
46f43a90492a Uploaded
greg
parents: 43
diff changeset
172 </when>
46f43a90492a Uploaded
greg
parents: 43
diff changeset
173 </conditional>
0
315440c6fb44 Uploaded
greg
parents:
diff changeset
174 </when>
315440c6fb44 Uploaded
greg
parents:
diff changeset
175 </conditional>
315440c6fb44 Uploaded
greg
parents:
diff changeset
176 <conditional name="create_orthogroup_cond">
315440c6fb44 Uploaded
greg
parents:
diff changeset
177 <param name="create_orthogroup" type="select" label="Create orthogroup fasta files?">
315440c6fb44 Uploaded
greg
parents:
diff changeset
178 <option value="no" selected="true">No</option>
315440c6fb44 Uploaded
greg
parents:
diff changeset
179 <option value="yes">Yes</option>
315440c6fb44 Uploaded
greg
parents:
diff changeset
180 </param>
315440c6fb44 Uploaded
greg
parents:
diff changeset
181 <when value="no" />
315440c6fb44 Uploaded
greg
parents:
diff changeset
182 <when value="yes">
17
cb7487bdab99 Uploaded
greg
parents: 16
diff changeset
183 <conditional name="create_corresponding_coding_sequences_cond">
cb7487bdab99 Uploaded
greg
parents: 16
diff changeset
184 <param name="create_corresponding_coding_sequences" type="select" label="Create corresponding coding sequences?">
cb7487bdab99 Uploaded
greg
parents: 16
diff changeset
185 <option value="no" selected="true">No</option>
cb7487bdab99 Uploaded
greg
parents: 16
diff changeset
186 <option value="yes">Yes</option>
cb7487bdab99 Uploaded
greg
parents: 16
diff changeset
187 </param>
cb7487bdab99 Uploaded
greg
parents: 16
diff changeset
188 <when value="no" />
cb7487bdab99 Uploaded
greg
parents: 16
diff changeset
189 <when value="yes">
cb7487bdab99 Uploaded
greg
parents: 16
diff changeset
190 <param name="coding_sequences" format="fasta" type="data" label="Corresponding coding sequences (CDS) fasta file"/>
cb7487bdab99 Uploaded
greg
parents: 16
diff changeset
191 </when>
cb7487bdab99 Uploaded
greg
parents: 16
diff changeset
192 </conditional>
0
315440c6fb44 Uploaded
greg
parents:
diff changeset
193 </when>
315440c6fb44 Uploaded
greg
parents:
diff changeset
194 </conditional>
315440c6fb44 Uploaded
greg
parents:
diff changeset
195 </when>
315440c6fb44 Uploaded
greg
parents:
diff changeset
196 </conditional>
315440c6fb44 Uploaded
greg
parents:
diff changeset
197 </inputs>
315440c6fb44 Uploaded
greg
parents:
diff changeset
198 <outputs>
15
9d4ec1102803 Uploaded
greg
parents: 14
diff changeset
199 <data name="hmmscan_log" format="txt" label="Protein classification hmmscan.log on ${on_string}">
9d4ec1102803 Uploaded
greg
parents: 14
diff changeset
200 <filter>save_hmmscan_log_cond['classifier'] in ['hmmscan', 'both'] and save_hmmscan_log_cond['save_hmmscan_log'] == 'yes'</filter>
9d4ec1102803 Uploaded
greg
parents: 14
diff changeset
201 </data>
38
b63f96ff6708 Uploaded
greg
parents: 37
diff changeset
202 <data name="output_ptcgf" format="ptcgf" label="Gene family clusters on ${on_string}">
33
c1a3b77de0f0 Uploaded
greg
parents: 32
diff changeset
203 <filter>options_type['options_type_selector'] == 'advanced' and options_type['create_orthogroup_cond']['create_orthogroup'] == 'yes' and options_type['create_orthogroup_cond']['create_corresponding_coding_sequences_cond']['create_corresponding_coding_sequences'] == 'no'</filter>
31
80e9d6e098ec Uploaded
greg
parents: 30
diff changeset
204 </data>
38
b63f96ff6708 Uploaded
greg
parents: 37
diff changeset
205 <data name="output_ptcgfcs" format="ptcgfcs" label="Gene family clusters and corresponding coding sequences on ${on_string}">
31
80e9d6e098ec Uploaded
greg
parents: 30
diff changeset
206 <filter>options_type['options_type_selector'] == 'advanced' and options_type['create_orthogroup_cond']['create_orthogroup'] == 'yes' and options_type['create_orthogroup_cond']['create_corresponding_coding_sequences_cond']['create_corresponding_coding_sequences'] == 'yes'</filter>
9
c7010d37df2c Uploaded
greg
parents: 8
diff changeset
207 </data>
45
916fb0014f89 Uploaded
greg
parents: 44
diff changeset
208 <data name="output_ptsco" format="txt" label="Single copy orthogroup on ${on_string}">
44
46f43a90492a Uploaded
greg
parents: 43
diff changeset
209 <filter>options_type['options_type_selector'] == 'advanced' and options_type['specify_single_copy_cond']['specify_single_copy'] == 'yes'</filter>
46f43a90492a Uploaded
greg
parents: 43
diff changeset
210 </data>
30
e9d9632762ca Uploaded
greg
parents: 29
diff changeset
211 <collection name="orthos" type="list">
12
b75510484c16 Uploaded
greg
parents: 11
diff changeset
212 <discover_datasets pattern="__name__" directory="geneFamilyClassification_dir" visible="false" ext="tabular" />
0
315440c6fb44 Uploaded
greg
parents:
diff changeset
213 </collection>
315440c6fb44 Uploaded
greg
parents:
diff changeset
214 </outputs>
315440c6fb44 Uploaded
greg
parents:
diff changeset
215 <tests>
39
c4f809cd2f38 Uploaded
greg
parents: 38
diff changeset
216 <!-- Not sure how to test this since the tool requires scaffolds data which is extremely large and installed using a Data Manager -->
c4f809cd2f38 Uploaded
greg
parents: 38
diff changeset
217 <!--
0
315440c6fb44 Uploaded
greg
parents:
diff changeset
218 <test>
30
e9d9632762ca Uploaded
greg
parents: 29
diff changeset
219 <param name="input" value="transcripts.cleaned.nr.pep" ftype="fasta" />
e9d9632762ca Uploaded
greg
parents: 29
diff changeset
220 <param name="scaffold" value="22Gv1.1"/>
e9d9632762ca Uploaded
greg
parents: 29
diff changeset
221 <param name="method" value="orthomcl"/>
e9d9632762ca Uploaded
greg
parents: 29
diff changeset
222 <param name="classifier" value="blastp"/>
0
315440c6fb44 Uploaded
greg
parents:
diff changeset
223 <param name="dereplicate" value="yes"/>
315440c6fb44 Uploaded
greg
parents:
diff changeset
224 <param name="min_length" value="200"/>
315440c6fb44 Uploaded
greg
parents:
diff changeset
225 <output_collection name="orthos" type="list">
35
0fc60c5cb719 Uploaded
greg
parents: 34
diff changeset
226 <element name="proteins.blastp.22Gv1.1" file="proteins.blastp.22Gv1.1" ftype="tabular"/>
0fc60c5cb719 Uploaded
greg
parents: 34
diff changeset
227 <element name="proteins.blastp.22Gv1.1.bestOrthos" file="proteins.blastp.22Gv1.1.bestOrthos" ftype="tabular"/>
0fc60c5cb719 Uploaded
greg
parents: 34
diff changeset
228 <element name="proteins.blastp.22Gv1.1.bestOrthos.summary" file="proteins.blastp.22Gv1.1.bestOrthos.summary" ftype="tabular"/>
0
315440c6fb44 Uploaded
greg
parents:
diff changeset
229 </output_collection>
315440c6fb44 Uploaded
greg
parents:
diff changeset
230 </test>
35
0fc60c5cb719 Uploaded
greg
parents: 34
diff changeset
231 -->
0
315440c6fb44 Uploaded
greg
parents:
diff changeset
232 </tests>
315440c6fb44 Uploaded
greg
parents:
diff changeset
233 <help>
315440c6fb44 Uploaded
greg
parents:
diff changeset
234 This tool is one of the PlantTribes' collection of automated modular analysis pipelines that utilize objective classifications of
28
a63b610ec5bd Uploaded
greg
parents: 27
diff changeset
235 complete protein sequences from sequenced plant genomes to perform comparative evolutionary studies. This tool classifies gene
a63b610ec5bd Uploaded
greg
parents: 27
diff changeset
236 sequences into precomputed orthologous gene family clusters using either blastp (faster), HMMScan (slower but more sensitive
a63b610ec5bd Uploaded
greg
parents: 27
diff changeset
237 to remote homologs) or both (more exhaustive).
a63b610ec5bd Uploaded
greg
parents: 27
diff changeset
238
30
e9d9632762ca Uploaded
greg
parents: 29
diff changeset
239 This tool accepts any of the following as input:
28
a63b610ec5bd Uploaded
greg
parents: 27
diff changeset
240
a63b610ec5bd Uploaded
greg
parents: 27
diff changeset
241 * the postprocessed assemblies produced by the **Postprocess de novo assembly transcripts into putative coding sequences** tool
a63b610ec5bd Uploaded
greg
parents: 27
diff changeset
242 * externally predicted coding sequences and their corresponding amino acid translations derived from a transcriptome assembly
a63b610ec5bd Uploaded
greg
parents: 27
diff changeset
243 * gene predictions from a sequenced genome
0
315440c6fb44 Uploaded
greg
parents:
diff changeset
244
315440c6fb44 Uploaded
greg
parents:
diff changeset
245 -----
315440c6fb44 Uploaded
greg
parents:
diff changeset
246
315440c6fb44 Uploaded
greg
parents:
diff changeset
247 **Options**
315440c6fb44 Uploaded
greg
parents:
diff changeset
248
315440c6fb44 Uploaded
greg
parents:
diff changeset
249 * **Orthogroups or gene families proteins scaffold** - PlantTribes scaffolds data.
28
a63b610ec5bd Uploaded
greg
parents: 27
diff changeset
250 * **Protein clustering method** - One of GFam (domain architecture based clustering), OrthoFinder (broadly defined clusters) or OrthoMCL (narrowly defined clusters).
a63b610ec5bd Uploaded
greg
parents: 27
diff changeset
251 * **Protein classification method** - blastp (faster), HMMScan (slower but more sensitive to remote homologs) or both (more exhaustive).
a63b610ec5bd Uploaded
greg
parents: 27
diff changeset
252 * **Super Orthogroups** - Secondary MCL clusters of orthogroups.
45
916fb0014f89 Uploaded
greg
parents: 44
diff changeset
253 * **Specify single copy orthogroup selection?** - Select 'Yes' to specify one of 'Single copy orthogroup custom' (not yet supported) or 'Minumum single copy taxa required in orthogroup'.
0
315440c6fb44 Uploaded
greg
parents:
diff changeset
254 * **Minumum single copy taxa required in orthogroup** - Used with "Minumum single copy taxa required in orthogroup" configuration only.
315440c6fb44 Uploaded
greg
parents:
diff changeset
255 * **Minumum taxa required in single copy orthogroup** - Used with "Minumum single copy taxa required in orthogroup" configuration only.
315440c6fb44 Uploaded
greg
parents:
diff changeset
256 * **Corresponding coding sequences (CDS) fasta file** - Used only when both "Create orthogroup fasta files?" and "Create corresponding coding sequences?" are set to 'Yes'.
315440c6fb44 Uploaded
greg
parents:
diff changeset
257
315440c6fb44 Uploaded
greg
parents:
diff changeset
258 </help>
315440c6fb44 Uploaded
greg
parents:
diff changeset
259 <citations>
315440c6fb44 Uploaded
greg
parents:
diff changeset
260 <citation type="bibtex">
315440c6fb44 Uploaded
greg
parents:
diff changeset
261 @unpublished{None,
28
a63b610ec5bd Uploaded
greg
parents: 27
diff changeset
262 author = {Eric Wafula},
0
315440c6fb44 Uploaded
greg
parents:
diff changeset
263 title = {None},
315440c6fb44 Uploaded
greg
parents:
diff changeset
264 year = {None},
35
0fc60c5cb719 Uploaded
greg
parents: 34
diff changeset
265 url = {https://github.com/dePamphilis/PlantTribes}
0fc60c5cb719 Uploaded
greg
parents: 34
diff changeset
266 }</citation>
0fc60c5cb719 Uploaded
greg
parents: 34
diff changeset
267 <citation type="doi">10.1186/1471-2105-10-421</citation>
0fc60c5cb719 Uploaded
greg
parents: 34
diff changeset
268 <citation type="bibtex">
0fc60c5cb719 Uploaded
greg
parents: 34
diff changeset
269 @unpublished{None,
0fc60c5cb719 Uploaded
greg
parents: 34
diff changeset
270 author = {None},
0fc60c5cb719 Uploaded
greg
parents: 34
diff changeset
271 title = {HMMER 3.1+ hmmscan search sequence(s) against a profile database},
0fc60c5cb719 Uploaded
greg
parents: 34
diff changeset
272 year = {2013},
0fc60c5cb719 Uploaded
greg
parents: 34
diff changeset
273 url = {http://hmmer.org/}
0
315440c6fb44 Uploaded
greg
parents:
diff changeset
274 }</citation>
315440c6fb44 Uploaded
greg
parents:
diff changeset
275 </citations>
315440c6fb44 Uploaded
greg
parents:
diff changeset
276 </tool>