annotate oases_optimiser.py @ 5:58bf34f98232 draft default tip

planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/msp_oases commit 3d96056b65a38e7642cfeef4ed274dc76b88472a
author drosofff
date Fri, 29 Apr 2016 03:14:58 -0400
parents b4d1940ecc90
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
435711ba68e3 planemo upload for repository https://bitbucket.org/drosofff/gedtools/
drosofff
parents:
diff changeset
1 #!/usr/bin/env python
435711ba68e3 planemo upload for repository https://bitbucket.org/drosofff/gedtools/
drosofff
parents:
diff changeset
2
435711ba68e3 planemo upload for repository https://bitbucket.org/drosofff/gedtools/
drosofff
parents:
diff changeset
3 """
435711ba68e3 planemo upload for repository https://bitbucket.org/drosofff/gedtools/
drosofff
parents:
diff changeset
4 VelvetOptimiser Wrapper
435711ba68e3 planemo upload for repository https://bitbucket.org/drosofff/gedtools/
drosofff
parents:
diff changeset
5 refactored using the adaptation of
435711ba68e3 planemo upload for repository https://bitbucket.org/drosofff/gedtools/
drosofff
parents:
diff changeset
6 Konrad Paszkiewicz University of Exeter, UK.
435711ba68e3 planemo upload for repository https://bitbucket.org/drosofff/gedtools/
drosofff
parents:
diff changeset
7
435711ba68e3 planemo upload for repository https://bitbucket.org/drosofff/gedtools/
drosofff
parents:
diff changeset
8 """
5
58bf34f98232 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/msp_oases commit 3d96056b65a38e7642cfeef4ed274dc76b88472a
drosofff
parents: 3
diff changeset
9 import os, sys
58bf34f98232 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/msp_oases commit 3d96056b65a38e7642cfeef4ed274dc76b88472a
drosofff
parents: 3
diff changeset
10 import subprocess
0
435711ba68e3 planemo upload for repository https://bitbucket.org/drosofff/gedtools/
drosofff
parents:
diff changeset
11
435711ba68e3 planemo upload for repository https://bitbucket.org/drosofff/gedtools/
drosofff
parents:
diff changeset
12
5
58bf34f98232 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/msp_oases commit 3d96056b65a38e7642cfeef4ed274dc76b88472a
drosofff
parents: 3
diff changeset
def stop_err(msg):
    """Report a fatal error and terminate the script.

    Writes ``msg`` followed by a newline to standard error, then raises
    ``SystemExit`` with status 1.

    Args:
        msg: text of the error message.

    Raises:
        SystemExit: always, with exit code 1.
    """
    sys.stderr.write("%s\n" % msg)
    # A bare sys.exit() exits with status 0, which reports success to the
    # calling process even though an error has just been printed.
    sys.exit(1)
435711ba68e3 planemo upload for repository https://bitbucket.org/drosofff/gedtools/
drosofff
parents:
diff changeset
16
5
58bf34f98232 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/msp_oases commit 3d96056b65a38e7642cfeef4ed274dc76b88472a
drosofff
parents: 3
diff changeset
17
58bf34f98232 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/msp_oases commit 3d96056b65a38e7642cfeef4ed274dc76b88472a
drosofff
parents: 3
diff changeset
def oases_optimiser(starthash, endhash, input):
    """Run velvet and oases over a range of k-mers, then merge the results.

    Replaces the call to oases_optimiser.sh. For every k-mer length from
    ``starthash`` up to, but not including, ``endhash`` in steps of 2, the
    pipeline ``velveth && velvetg && oases`` is run in a folder named
    ``outputFolder_<k>``. Afterwards the ``transcripts.fa`` files of all
    ``outputFolder_*`` folders are merged into ``MergedAssemblyFolder``.

    Args:
        starthash: first k-mer length (int).
        endhash: exclusive upper bound of the k-mer range (int).
        input: velveth input arguments; inserted verbatim into the shell
            command line, so it must already be valid shell syntax.

    Raises:
        Exception: if the merge pipeline exits with a non-zero status.
    """
    # range() instead of xrange(): same iteration, but also defined on
    # Python 3 where xrange raises NameError.
    for kmer in range(starthash, endhash, 2):
        folder = "outputFolder_{0}".format(kmer)
        assemble_cmd = " && ".join([
            "velveth {0} {1} {2}".format(folder, kmer, input),
            "velvetg {0} -read_trkg yes".format(folder),
            "oases {0}".format(folder),
        ])
        # The child's stderr is sent to this script's stdout.
        returncode = subprocess.call(args=assemble_cmd, shell=True,
                                     stdout=sys.stdout, stderr=sys.stdout)
        if returncode != 0:
            # A failure at a single k-mer is reported but not fatal; the
            # remaining k-mers are still attempted.
            print("Oases failed at k-mer %s, skipping" % kmer)

    # Merge step: the shell expands the glob over every per-k-mer folder
    # that produced a transcripts.fa file.
    merge_cmd = " && ".join([
        "velveth MergedAssemblyFolder 27 -long outputFolder_*/transcripts.fa",
        "velvetg MergedAssemblyFolder -read_trkg yes -conserveLong yes",
        "oases MergedAssemblyFolder -merge yes",
    ])
    returncode = subprocess.call(args=merge_cmd, shell=True,
                                 stdout=sys.stdout, stderr=sys.stdout)
    if returncode != 0:
        raise Exception("Oases could not merge assembly")
3
b4d1940ecc90 planemo upload for repository https://bitbucket.org/drosofff/gedtools/
drosofff
parents: 0
diff changeset
37
0
435711ba68e3 planemo upload for repository https://bitbucket.org/drosofff/gedtools/
drosofff
parents:
diff changeset
def __main__():
    """Command-line entry point.

    Reads four positional arguments from ``sys.argv``:

    1. start hash (k-mer) length, converted to int
    2. end hash (k-mer) length, converted to int
    3. velveth input arguments, passed through to ``oases_optimiser``
    4. path of the file to write the merged transcripts to

    Runs ``oases_optimiser`` and, on any exception, reports it through
    ``stop_err``. Afterwards copies ``MergedAssemblyFolder/transcripts.fa``
    line by line into the requested output file.
    """
    starthash = int(sys.argv[1])
    endhash = int(sys.argv[2])
    velveth_args = sys.argv[3]
    transcripts = sys.argv[4]
    try:
        oases_optimiser(starthash, endhash, velveth_args)
    # "except Exception as e" is accepted by Python 2.6+ and Python 3; the
    # comma form is a syntax error on Python 3.
    except Exception as e:
        stop_err('Error running oases_optimiser.py\n' + str(e))
    transcript_path = os.path.join("MergedAssemblyFolder", 'transcripts.fa')
    with open(transcripts, 'w') as out:
        # Open the merged file in a with-block so its handle is closed
        # deterministically instead of being left to the garbage collector.
        with open(transcript_path) as merged:
            for line in merged:
                out.write(line)
58bf34f98232 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/msp_oases commit 3d96056b65a38e7642cfeef4ed274dc76b88472a
drosofff
parents: 3
diff changeset
51
58bf34f98232 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/msp_oases commit 3d96056b65a38e7642cfeef4ed274dc76b88472a
drosofff
parents: 3
diff changeset
52
0
435711ba68e3 planemo upload for repository https://bitbucket.org/drosofff/gedtools/
drosofff
parents:
diff changeset
# Run the command-line entry point only when executed as a script.
if __name__ == "__main__":
    __main__()