comparison gene_family_classifier.xml @ 35:0fc60c5cb719 draft

Uploaded
author greg
date Thu, 02 Feb 2017 10:06:11 -0500
parents 9a60634252fd
children d485da50616b
comparison
equal deleted inserted replaced
34:9a60634252fd 35:0fc60c5cb719
11 <regex match="Error:" /> 11 <regex match="Error:" />
12 <regex match="Exception:" /> 12 <regex match="Exception:" />
13 </stdio> 13 </stdio>
14 <command> 14 <command>
15 <![CDATA[ 15 <![CDATA[
16 #import os
17 #set scaffold_path = $scaffold.fields.path
18 #set scaffold_dir = $os.path.split($scaffold_path)[0]
19 #set scaffold_selection = $os.path.split($scaffold_path)[1]
20
16 #if str($options_type.options_type_selector) == 'advanced': 21 #if str($options_type.options_type_selector) == 'advanced':
17 #set create_orthogroup_cond = $options_type.create_orthogroup_cond 22 #set create_orthogroup_cond = $options_type.create_orthogroup_cond
18 #set create_orthogroup = $create_orthogroup_cond.create_orthogroup 23 #set create_orthogroup = $create_orthogroup_cond.create_orthogroup
19 24
20 #if str($create_orthogroup) == 'yes': 25 #if str($create_orthogroup) == 'yes':
23 #set create_corresponding_coding_sequences = True 28 #set create_corresponding_coding_sequences = True
24 #else: 29 #else:
25 #set create_corresponding_coding_sequences = False 30 #set create_corresponding_coding_sequences = False
26 #end if 31 #end if
27 32
28 #import os
29 #set create_ortho_sequences = True 33 #set create_ortho_sequences = True
30 #set orthogroups_fasta_src_dir = $os.path.join('geneFamilyClassification_dir', 'orthogroups_fasta') 34 #set orthogroups_fasta_src_dir = $os.path.join('geneFamilyClassification_dir', 'orthogroups_fasta')
31 #if $create_corresponding_coding_sequences: 35 #if $create_corresponding_coding_sequences:
32 #set dest_dir = $output_pgfccs.extra_files_path 36 #set dest_dir = $output_pgfccs.extra_files_path
33 #else: 37 #else:
42 #set create_ortho_sequences = False 46 #set create_ortho_sequences = False
43 #set create_corresponding_coding_sequences = False 47 #set create_corresponding_coding_sequences = False
44 #end if 48 #end if
45 49
46 GeneFamilyClassifier 50 GeneFamilyClassifier
47 --proteins "$input" 51 --proteins '$input'
48 --scaffold_dir "${GALAXY_DATA_INDEX_DIR}/plant_tribes/scaffolds" 52 --scaffold_dir '$scaffold_dir'
49 --scaffold "$scaffold" 53 --scaffold '$scaffold_selection'
50 --method $method 54 --method $method
51 --classifier $save_hmmscan_log_cond.classifier 55 --classifier $save_hmmscan_log_cond.classifier
52 --num_threads \${GALAXY_SLOTS:-4} 56 --num_threads \${GALAXY_SLOTS:-4}
53 57
54 #if str($options_type.options_type_selector) == 'advanced': 58 #if str($options_type.options_type_selector) == 'advanced':
58 --taxa_present $options_type.single_copy_cond.taxa_present 62 --taxa_present $options_type.single_copy_cond.taxa_present
59 #end if 63 #end if
60 #if str($create_orthogroup) == 'yes': 64 #if str($create_orthogroup) == 'yes':
61 --orthogroup_fasta 65 --orthogroup_fasta
62 #if $create_corresponding_coding_sequences: 66 #if $create_corresponding_coding_sequences:
63 --coding_sequences "$create_corresponding_coding_sequences_cond.coding_sequences" 67 --coding_sequences '$create_corresponding_coding_sequences_cond.coding_sequences'
64 #end if 68 #end if
65 #end if 69 #end if
66 #end if 70 #end if
67 71
68 #if str($save_hmmscan_log_cond.classifier) == 'hmmscan' or str($save_hmmscan_log_cond.classifier) == 'both': 72 #if str($save_hmmscan_log_cond.classifier) == 'hmmscan' or str($save_hmmscan_log_cond.classifier) == 'both':
73 #end if 77 #end if
74 #end if 78 #end if
75 79
76 #if $create_ortho_sequences: 80 #if $create_ortho_sequences:
77 #if $create_corresponding_coding_sequences: 81 #if $create_corresponding_coding_sequences:
78 && echo "# Precomputed orthologous gene family clusters with corresponding coding sequences: `ls $orthogroups_fasta_src_dir | grep f | wc -l` files" > $output_pgfccs 82 && echo '# Precomputed orthologous gene family clusters with corresponding coding sequences: `ls $orthogroups_fasta_src_dir | grep f | wc -l` files' > $output_pgfccs
79 && ls -al $orthogroups_fasta_src_dir | grep f >> $output_pgfccs 83 && ls -al $orthogroups_fasta_src_dir | grep f >> $output_pgfccs
80 #else: 84 #else:
81 && echo "# Precomputed orthologous gene family clusters: `ls $orthogroups_fasta_src_dir | grep f | wc -l` files" > $output_pgfc 85 && echo '# Precomputed orthologous gene family clusters: `ls $orthogroups_fasta_src_dir | grep f | wc -l` files' > $output_pgfc
82 && ls -al $orthogroups_fasta_src_dir | grep f >> $output_pgfc 86 && ls -al $orthogroups_fasta_src_dir | grep f >> $output_pgfc
83 #end if 87 #end if
84 && mv $orthogroups_fasta_src_dir/* $dest_dir || true 88 && mv $orthogroups_fasta_src_dir/* $dest_dir || true
85 #end if 89 #end if
86 90
174 <collection name="orthos" type="list"> 178 <collection name="orthos" type="list">
175 <discover_datasets pattern="__name__" directory="geneFamilyClassification_dir" visible="false" ext="tabular" /> 179 <discover_datasets pattern="__name__" directory="geneFamilyClassification_dir" visible="false" ext="tabular" />
176 </collection> 180 </collection>
177 </outputs> 181 </outputs>
178 <tests> 182 <tests>
183 <!-- Not sure how to test this since the tool requires scaffolds data which is extremely large and installed using a Data Manager -->
184 <!--
179 <test> 185 <test>
180 <!-- Not sure how to test this since the tool requires scaffolds data which is extremely large and installed using a Data Manager -->
181 <param name="input" value="transcripts.cleaned.nr.pep" ftype="fasta" /> 186 <param name="input" value="transcripts.cleaned.nr.pep" ftype="fasta" />
182 <param name="scaffold" value="22Gv1.1"/> 187 <param name="scaffold" value="22Gv1.1"/>
183 <param name="method" value="orthomcl"/> 188 <param name="method" value="orthomcl"/>
184 <param name="classifier" value="blastp"/> 189 <param name="classifier" value="blastp"/>
185 <param name="dereplicate" value="yes"/> 190 <param name="dereplicate" value="yes"/>
186 <param name="min_length" value="200"/> 191 <param name="min_length" value="200"/>
187 <output_collection name="orthos" type="list"> 192 <output_collection name="orthos" type="list">
188 <element name="proteins.blastp.22Gv1.1" file="proteins.blastp.22Gv1.1" ftype="tabular" compare="contains"/> 193 <element name="proteins.blastp.22Gv1.1" file="proteins.blastp.22Gv1.1" ftype="tabular"/>
189 <element name="proteins.blastp.22Gv1.1.bestOrthos" file="proteins.blastp.22Gv1.1.bestOrthos" ftype="tabular" compare="contains"/> 194 <element name="proteins.blastp.22Gv1.1.bestOrthos" file="proteins.blastp.22Gv1.1.bestOrthos" ftype="tabular"/>
190 <element name="proteins.blastp.22Gv1.1.bestOrthos.summary" file="proteins.blastp.22Gv1.1.bestOrthos.summary" ftype="tabular" compare="contains"/> 195 <element name="proteins.blastp.22Gv1.1.bestOrthos.summary" file="proteins.blastp.22Gv1.1.bestOrthos.summary" ftype="tabular"/>
191 </output_collection> 196 </output_collection>
192 </test> 197 </test>
198 -->
193 </tests> 199 </tests>
194 <help> 200 <help>
195 This tool is one of the PlantTribes' collection of automated modular analysis pipelines that utilize objective classifications of 201 This tool is one of the PlantTribes' collection of automated modular analysis pipelines that utilize objective classifications of
196 complete protein sequences from sequenced plant genomes to perform comparative evolutionary studies. This tool classifies gene 202 complete protein sequences from sequenced plant genomes to perform comparative evolutionary studies. This tool classifies gene
197 sequences into precomputed orthologous gene family clusters using either blastp (faster), HMMScan (slower but more sensitive 203 sequences into precomputed orthologous gene family clusters using either blastp (faster), HMMScan (slower but more sensitive
220 <citation type="bibtex"> 226 <citation type="bibtex">
221 @unpublished{None, 227 @unpublished{None,
222 author = {Eric Wafula}, 228 author = {Eric Wafula},
223 title = {None}, 229 title = {None},
224 year = {None}, 230 year = {None},
225 eprint = {None}, 231 url = {https://github.com/dePamphilis/PlantTribes}
226 url = {None} 232 }</citation>
233 <citation type="doi">10.1186/1471-2105-10-421</citation>
234 <citation type="bibtex">
235 @unpublished{None,
236 author = {None},
237 title = {HMMER 3.1+ hmmscan search sequence(s) against a profile database},
238 year = {2013},
239 url = {http://hmmer.org/}
227 }</citation> 240 }</citation>
228 </citations> 241 </citations>
229 </tool> 242 </tool>