annotate glimmer2seq.py @ 0:7ac31bffa17e draft default tip

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
author iuc
date Tue, 28 Nov 2017 09:55:59 -0500
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
1 #!/usr/bin/env python
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
2 """
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
3 Input: DNA FASTA file + Glimmer ORF file
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
4 Output: ORF sequences as FASTA file
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
5 Author: Bjoern Gruening
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
6 """
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
7 import sys
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
8
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
9 from Bio import SeqIO
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
10 from Bio.SeqRecord import SeqRecord
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
11
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
12
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
13 def glimmer2seq(glimmer_prediction=sys.argv[1], genome_sequence=sys.argv[2], outfile=sys.argv[3]):
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
14 if len(sys.argv) >= 4:
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
15 glimmerfile = open(glimmer_prediction, "r")
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
16 sequence = open(genome_sequence)
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
17 else:
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
18 print("Missing input values.")
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
19 sys.exit()
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
20
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
21 fastafile = SeqIO.parse(sequence, "fasta")
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
22
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
23 sequences = dict()
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
24 seq_records = list()
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
25 for entry in fastafile:
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
26 sequences[entry.description] = entry
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
27
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
28 for line in glimmerfile:
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
29 if line.startswith('>'):
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
30 entry = sequences[line[1:].strip()]
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
31 else:
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
32 orf_start = int(line[8:17])
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
33 orf_end = int(line[18:26])
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
34
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
35 orf_name = line[0:8]
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
36 if orf_start <= orf_end:
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
37 seq_records.append(SeqRecord(entry.seq[orf_start - 1:orf_end], id=orf_name, description=entry.description))
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
38 else:
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
39 seq_records.append(SeqRecord(entry.seq[orf_end - 1:orf_start].reverse_complement(), id=orf_name, description=entry.description))
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
40
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
41 SeqIO.write(seq_records, outfile, "fasta")
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
42 glimmerfile.close()
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
43 sequence.close()
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
44
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
45
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
46 if __name__ == "__main__":
7ac31bffa17e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
iuc
parents:
diff changeset
47 glimmer2seq()