annotate interproscan.xml @ 0:98c6e970cbc1 draft

Uploaded
author bgruening
date Thu, 22 Aug 2013 08:07:13 -0400
parents
children 2d56d3ae499c
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
1 <tool id="interproscan" name="Interproscan functional predictions of ORFs" version="5.0.0">
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
2 <description>Interproscan functional predictions of ORFs</description>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
3 <requirements>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
4 <requirement type="package">signalp</requirement>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
5 <requirement type="package">phobius</requirement>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
6 <requirement type="package">tmhmm</requirement>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
7 <requirement type="set_environment">INTERPROSCAN_SCRIPT_PATH</requirement>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
8 </requirements>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
9 <command>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
10 #import os
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
11 interproscan.sh -dp --fasta $infile --seqtype $seqtype -f $oformat --applications $appl --tempdir \$TEMP
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
12
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
13 $pathways
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
14 $goterms
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
15 $iprlookup
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
16
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
17 #if str($oformat) in ['SVG', 'HTML']:
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
18 --output-file-base $outfile
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
19 2>&#38;1;
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
20 mkdir -p $outfile.files_path;
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
21 #set temp_archive_file = str($outfile) + '.' + str($oformat).lower() + '.tar.gz'
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
22 tar -C $outfile.files_path -xvmzf $temp_archive_file;
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
23 python \$INTERPROSCAN_SCRIPT_PATH/create_index.py $outfile $outfile.files_path;
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
24 rm $temp_archive_file
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
25 #else:
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
26 -o $outfile
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
27 2>&#38;1
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
28 #end if
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
29
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
30 </command>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
31 <inputs>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
32 <param name="infile" type="data" format="fasta" label="Protein Fasta File"/>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
33
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
34 <param name="seqtype" type="select" label="Type of the input sequences" help="">
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
35 <option value="p" selected="true">Protein</option>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
36 <option value="n">DNA / RNA</option>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
37 </param>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
38
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
39 <param name="appl" type="select" multiple="True" display="checkboxes" label="Applications to run" help="Select your programm.">
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
40 <option value="TIGRFAM" selected="true">TIGRFAM: protein families based on Hidden Markov Models or HMMs</option>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
41 <option value="PIRSF" selected="true">PIRSF: non-overlapping clustering of UniProtKB sequences into a hierarchical order (evolutionary relationships)</option>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
42 <option value="ProDom" selected="true">ProDom: set of protein domain families generated from the UniProtKB</option>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
43 <option value="Panther" selected="true">Panther: Protein ANalysis THrough Evolutionary Relationships</option>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
44 <option value="SMART" selected="true">SMART: identification and analysis of domain architectures based on Hidden Markov Models or HMMs</option>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
45 <option value="PrositeProfiles" selected="true">PROSITE Profiles: protein domains, families and functional sites as well as associated profiles to identify them</option>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
46 <option value="PrositePatterns" selected="true">PROSITE Pattern: protein domains, families and functional sites as well as associated patterns to identify them</option>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
47 <option value="HAMAP" selected="true">HAMAP: High-quality Automated Annotation of Microbial Proteomes</option>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
48 <option value="PfamA" selected="true">PfamA: protein families, each represented by multiple sequence alignments and hidden Markov models</option>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
49 <option value="PRINTS" selected="true">PRINTS: group of conserved motifs (fingerprints) used to characterise a protein family</option>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
50 <option value="SuperFamily" selected="true">SUPERFAMILY: database of structural and functional annotation</option>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
51 <option value="Coils" selected="true">Coils: Prediction of Coiled Coil Regions in Proteins</option>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
52 <option value="Gene3d" selected="true">Gene3d: Structural assignment for whole genes and genomes using the CATH domain structure database</option>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
53 <option value="SignalP-GRAM_POSITIVE" selected="false">SignalP Gram Positive Bacteria</option>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
54 <option value="SignalP-GRAM_NEGATIVE" selected="false">SignalP Gram Negative Bacteria</option>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
55 <option value="SignalP-EUK" selected="true">SignalP Eukaryotic Bacteria</option>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
56 <option value="Phobius" selected="true">Phobius: combined transmembrane topology and signal peptide predictor</option>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
57 <option value="TMHMM" selected="true">TMHMM: Prediction of transmembrane helices in proteins</option>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
58 </param>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
59
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
60 <param name="pathways" truevalue="--pathways" falsevalue="" checked="True" type="boolean" label="Include pathway information" help="Option that provides mappings from matches to pathway information, which is based on the matched manually curated InterPro entries."/>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
61 <param name="goterms" truevalue="--goterms" falsevalue="" checked="True" type="boolean" label="Include Gene Ontology (GO) mappings" />
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
62 <param name="iprlookup" truevalue="--iprlookup" falsevalue="" checked="False" type="boolean" label="Provide mappings from matched member database signatures to the InterPro entries that they are integrated into" />
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
63
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
64 <param name="oformat" type="select" label="Output format" help="Please select a output format.">
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
65 <option value="TSV" selected="true">Tab-separated values format (TSV)</option>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
66 <option value="GFF3">GFF3</option>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
67 <option value="SVG">SVG</option>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
68 <option value="HTML">HTML</option>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
69 <option value="XML">XML</option>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
70 </param>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
71
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
72 </inputs>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
73 <outputs>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
74
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
75 <data format="tabular" name="outfile" label="Interproscan calculation on ${on_string}">
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
76 <change_format>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
77 <when input="oformat" value="HTML" format="html"/>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
78 <when input="oformat" value="XML" format="xml"/>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
79 <when input="oformat" value="SVG" format="html"/>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
80 <when input="oformat" value="GFF3" format="gff"/>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
81 </change_format>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
82 </data>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
83
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
84 </outputs>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
85 <requirements>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
86 </requirements>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
87 <help>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
88
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
89 **What it does**
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
90
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
91 Interproscan is a batch tool to query the Interpro database. It provides annotations based on multiple searches of profile and other functional databases.
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
92
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
93
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
94 #####
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
95 Input
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
96 #####
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
97
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
98 Required is a FASTA file containing protein or nucleotide sequences.
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
99
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
100
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
101 ######
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
102 Output
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
103 ######
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
104
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
105 In this version of InterProScan_, you can retrieve output in any of the following five formats:
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
106
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
107 * TSV: a simple tab-delimited file format
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
108 * XML: the new "IMPACT" XML format (XSD available here_).
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
109 * GFF: The `GFF 3.0`_ format
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
110 * HTML: An HTML representation of the protein matches
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
111 * SVG: An Scalable Vector Graphics representation of the protein matches
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
112
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
113
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
114 .. _`GFF3 3.0`: http://gmod.org/wiki/GFF#GFF3_Format
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
115 .. _here: http://www.ebi.ac.uk/interpro/resources/schemas/interproscan5
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
116
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
117
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
118 Previous versions of InterProScan_ 5 (I5RC1 - I5RC6) could only output data for nucleotide sequences in XML and GFF3. This has now changed and InterProScan_ 5 can output results for nucleotide sequences in all formats. *Please note* you can only trace protein match positions to the original nucleotide sequence with GFF3 and XML.
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
119
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
120 You can override the default output formats using the *-f* option, e.g.::
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
121
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
122 ./interproscan.sh -f XML -f HTML -i /path/to/sequences.fasta -b /path/to/output_file
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
123
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
124 or
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
125
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
126 ::
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
127
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
128 ./interproscan.sh -f XML, HTML -i /path/to/sequences.fasta -b /path/to/output_file
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
129
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
130
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
131 These two equivalent commands will output the results in XML and HTML format.
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
132
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
133 Tab-separated values format (TSV)
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
134 =================================
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
135
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
136 Basic tab delimited format.
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
137
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
138
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
139 Example Output
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
140 --------------
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
141
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
142 ::
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
143
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
144 P51587 14086411a2cdf1c4cba63020e1622579 3418 Pfam PF09103 BRCA2, oligonucleotide/oligosaccharide-binding, domain 1 2670 2799 7.9E-43 T 15-03-2013
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
145 P51587 14086411a2cdf1c4cba63020e1622579 3418 ProSiteProfiles PS50138 BRCA2 repeat profile. 1002 1036 0.0 T 18-03-2013 IPR002093 BRCA2 repeat GO:0005515|GO:0006302
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
146 P51587 14086411a2cdf1c4cba63020e1622579 3418 Gene3D G3DSA:2.40.50.140 2966 3051 3.1E-52 T 15-03-2013
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
147 ...
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
148
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
149
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
150 The TSV format presents the match data in columns as follows:
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
151
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
152 - Protein Accession (e.g. P51587)
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
153 - Sequence MD5 digest (e.g. 14086411a2cdf1c4cba63020e1622579)
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
154 - Sequence Length (e.g. 3418)
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
155 - Analysis (e.g. Pfam / PRINTS / Gene3D)
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
156 - Signature Accession (e.g. PF09103 / G3DSA:2.40.50.140)
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
157 - Signature Description (e.g. BRCA2 repeat profile)
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
158 - Start location
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
159 - Stop location
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
160 - Score - is the e-value of the match reported by member database method (e.g. 3.1E-52)
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
161 - Status - is the status of the match (T: true)
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
162 - Date - is the date of the run
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
163 - (InterProScan_ annotations - accession (e.g. IPR002093) - optional column; only displayed if -iprscan option is switched on)
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
164 - (InterProScan_ annotations - description (e.g. BRCA2 repeat) - optional column; only displayed if -iprscan option is switched on)
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
165 - (GO annotations (e.g. GO:0005515) - optional column; only displayed if --goterms option is switched on)
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
166 - (Pathways annotations (e.g. REACT_71) - optional column; only displayed if --pathways option is switched on)
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
167
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
168
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
169 Extensible Markup Language (XML)
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
170 ================================
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
171
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
172 XML representation of the matches - this is the richest form of the data. The XML Schema Definition (XSD) is available [http://www.ebi.ac.uk/interpro/resources/schemas/interproscan5 here].
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
173
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
174 Example Output
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
175 --------------
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
176
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
177 ::
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
178
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
179 .. image:: $PATH_TO_IMAGES/example_xml_output.png
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
180
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
181
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
182
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
183 Generic Feature Format Version 3 (GFF3)
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
184 =======================================
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
185
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
186 The GFF3 format is a flat tab-delimited file, which is much richer then the TSV output format. It allows you to trace back from matches to predicted proteins and to nucleic acid sequences. It also contains a FASTA format representation of the predicted protein sequences and their matches. You will find a documentation of all the columns and attributes used on [http://www.sequenceontology.org/gff3.shtml].
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
187
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
188 Example Output
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
189 --------------
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
190
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
191 ::
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
192
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
193 ##gff-version 3
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
194 ##feature-ontology http://song.cvs.sourceforge.net/viewvc/song/ontology/sofa.obo?revision=1.269
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
195 ##sequence-region AACH01000027 1 1347
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
196 ##seqid|source|type|start|end|score|strand|phase|attributes
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
197 AACH01000027 provided_by_user nucleic_acid 1 1347 . + . Name=AACH01000027;md5=b2a7416cb92565c004becb7510f46840;ID=AACH01000027
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
198 AACH01000027 getorf ORF 1 1347 . + . Name=AACH01000027.2_21;Target=pep_AACH01000027_1_1347 1 449;md5=b2a7416cb92565c004becb7510f46840;ID=orf_AACH01000027_1_1347
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
199 AACH01000027 getorf polypeptide 1 449 . + . md5=fd0743a673ac69fb6e5c67a48f264dd5;ID=pep_AACH01000027_1_1347
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
200 AACH01000027 Pfam protein_match 84 314 1.2E-45 + . Name=PF00696;signature_desc=Amino acid kinase family;Target=null 84 314;status=T;ID=match$8_84_314;Ontology_term="GO:0008652";date=15-04-2013;Dbxref="InterPro:IPR001048","Reactome:REACT_13"
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
201 ##sequence-region 2
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
202 ...
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
203 >pep_AACH01000027_1_1347
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
204 LVLLAAFDCIDDTKLVKQIIISEIINSLPNIVNDKYGRKVLLYLLSPRDPAHTVREIIEV
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
205 LQKGDGNAHSKKDTEIRRREMKYKRIVFKVGTSSLTNEDGSLSRSKVKDITQQLAMLHEA
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
206 GHELILVSSGAIAAGFGALGFKKRPTKIADKQASAAVGQGLLLEEYTTNLLLRQIVSAQI
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
207 LLTQDDFVDKRRYKNAHQALSVLLNRGAIPIINENDSVVIDELKVGDNDTLSAQVAAMVQ
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
208 ADLLVFLTDVDGLYTGNPNSDPRAKRLERIETINREIIDMAGGAGSSNGTGGMLTKIKAA
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
209 TIATESGVPVYICSSLKSDSMIEAAEETEDGSYFVAQEKGLRTQKQWLAFYAQSQGSIWV
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
210 DKGAAEALSQYGKSLLLSGIVEAEGVFSYGDIVTVFDKESGKSLGKGRVQFGASALEDML
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
211 RSQKAKGVLIYRDDWISITPEIQLLFTEF
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
212 ...
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
213 >match$8_84_314
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
214 KRIVFKVGTSSLTNEDGSLSRSKVKDITQQLAMLHEAGHELILVSSGAIAAGFGALGFKK
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
215 RPTKIADKQASAAVGQGLLLEEYTTNLLLRQIVSAQILLTQDDFVDKRRYKNAHQALSVL
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
216 LNRGAIPIINENDSVVIDELKVGDNDTLSAQVAAMVQADLLVFLTDVDGLYTGNPNSDPR
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
217 AKRLERIETINREIIDMAGGAGSSNGTGGMLTKIKAATIATESGVPVYICS
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
218
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
219
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
220 Scalable Vector Graphics (SVG) and HyperText Markup Language (HTML)
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
221 ====================================================================
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
222
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
223 InterProScan_ 5 outputs a single HTML/SVG file for each protein sequence analysed. The HTML/SVG file(s) are compressed into a single gzipped tar archive (or "tarball") that includes the resources (images, Javascript, style etc) to render the pages/images in a browser or image viewer. (Note that from version 5RC4, the SVG format has no external dependencies.)
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
224
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
225 The tarball will be named something similar to::
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
226
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
227 base_output_file_name.html.tar.gz OR base_output_file_name.svg.tar.gz
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
228
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
229
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
230 To access the HTML pages/SVG images, unzip the tarball using a command like:
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
231
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
232 tar -xvzf base_output_file_name.html(svg).tar.gz
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
233
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
234 You can then open the unzipped HTML/SVG files in any browser or image viewer (for SVG).
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
235
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
236 Example Output
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
237 --------------
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
238
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
239 .. image:: $PATH_TO_IMAGES/P51587.svg.png
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
240
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
241 .. _InterProScan: http://www.ebi.ac.uk/interpro
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
242
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
243
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
244 ----------
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
245 References
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
246 ----------
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
247
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
248 Zdobnov EM, Apweiler R (2001)
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
249 InterProScan an integration platform for the signature-recognition methods in InterPro.
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
250 Bioinformatics 17, 847-848.
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
251 http://dx.doi.org/10.1093/bioinformatics/17.9.847
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
252
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
253 Quevillon E, Silventoinen V, Pillai S, Harte N, Mulder N, Apweiler R, Lopez R (2005)
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
254 InterProScan: protein domains identifier.
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
255 Nucleic Acids Research 33 (Web Server issue), W116-W120.
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
256 http://dx.doi.org/10.1093/nar/gki442
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
257
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
258 Hunter S, Apweiler R, Attwood TK, Bairoch A, Bateman A, Binns D, Bork P, Das U, Daugherty L, Duquenne L, Finn RD, Gough J, Haft D, Hulo N, Kahn D, Kelly E, Laugraud A, Letunic I, Lonsdale D, Lopez R, Madera M, Maslen J, McAnulla C, McDowall J, Mistry J, Mitchell A, Mulder N, Natale D, Orengo C, Quinn AF, Selengut JD, Sigrist CJ, Thimma M, Thomas PD, Valentin F, Wilson D, Wu CH, Yeats C. (2009)
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
259 InterPro: the integrative protein signature database.
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
260 Nucleic Acids Research 37 (Database Issue), D224-228.
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
261 http://dx.doi.org/10.1093/nar/gkn785
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
262
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
263
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
264 This wrapper is available to install into other Galaxy Instances via the Galaxy Tool Shed at
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
265 http://toolshed.g2.bx.psu.edu/view/bgruening/interproscan
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
266
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
267
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
268 **Galaxy Wrapper Author**::
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
269
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
270 * Bjoern Gruening, Pharmaceutical Bioinformatics, University of Freiburg
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
271 * Konrad Paszkiewicz, Exeter Sequencing Service, University of Exeter
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
272
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
273 </help>
98c6e970cbc1 Uploaded
bgruening
parents:
diff changeset
274 </tool>