comparison tools/mira4_0/mira4_convert.py @ 31:fd95aaef8818 draft

planemo upload for repository https://github.com/peterjc/galaxy_mira/tree/master/tools/mira4_0 commit bc3d484c5cd68ddcf456db2fff489d584aa2034c
author peterjc
date Wed, 10 Feb 2016 09:07:39 -0500
parents 55ae131c5862
children 56b421d59805
comparison
equal deleted inserted replaced
30:b506e3b779fa 31:fd95aaef8818
5 """ 5 """
6 import os 6 import os
7 import sys 7 import sys
8 import subprocess 8 import subprocess
9 import shutil 9 import shutil
10 import time
11 import tempfile
12 from optparse import OptionParser 10 from optparse import OptionParser
13 try: 11 try:
14 from io import BytesIO 12 from io import BytesIO
15 except ImportError: 13 except ImportError:
16 #Should we worry about Python 2.5 or older? 14 #Should we worry about Python 2.5 or older?
19 #Do we need any PYTHONPATH magic? 17 #Do we need any PYTHONPATH magic?
20 from mira4_make_bam import depad 18 from mira4_make_bam import depad
21 19
22 WRAPPER_VER = "0.0.7" # Keep in sync with the XML file 20 WRAPPER_VER = "0.0.7" # Keep in sync with the XML file
23 21
24 def sys_exit(msg, err=1):
25 sys.stderr.write(msg+"\n")
26 sys.exit(err)
27 22
28 def run(cmd): 23 def run(cmd):
29 #Avoid using shell=True when we call subprocess to ensure if the Python 24 #Avoid using shell=True when we call subprocess to ensure if the Python
30 #script is killed, so too is the child process. 25 #script is killed, so too is the child process.
31 try: 26 try:
32 child = subprocess.Popen(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE) 27 child = subprocess.Popen(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
33 except Exception, err: 28 except Exception, err:
34 sys_exit("Error invoking command:\n%s\n\n%s\n" % (" ".join(cmd), err)) 29 sys.exit("Error invoking command:\n%s\n\n%s\n" % (" ".join(cmd), err))
35 #Use .communicate as can get deadlocks with .wait(), 30 #Use .communicate as can get deadlocks with .wait(),
36 stdout, stderr = child.communicate() 31 stdout, stderr = child.communicate()
37 return_code = child.returncode 32 return_code = child.returncode
38 if return_code: 33 if return_code:
39 cmd_str = " ".join(cmd) # doesn't quote spaces etc 34 cmd_str = " ".join(cmd) # doesn't quote spaces etc
40 if stderr and stdout: 35 if stderr and stdout:
41 sys_exit("Return code %i from command:\n%s\n\n%s\n\n%s" % (return_code, cmd_str, stdout, stderr)) 36 sys.exit("Return code %i from command:\n%s\n\n%s\n\n%s" % (return_code, cmd_str, stdout, stderr))
42 else: 37 else:
43 sys_exit("Return code %i from command:\n%s\n%s" % (return_code, cmd_str, stderr)) 38 sys.exit("Return code %i from command:\n%s\n%s" % (return_code, cmd_str, stderr))
44 39
45 def get_version(mira_binary): 40 def get_version(mira_binary):
46 """Run MIRA to find its version number""" 41 """Run MIRA to find its version number"""
47 # At the command line I would use: mira -v | head -n 1 42 # At the command line I would use: mira -v | head -n 1
48 # however there is some pipe error when doing that here. 43 # however there is some pipe error when doing that here.
96 parser.add_option("-v", "--version", dest="version", 91 parser.add_option("-v", "--version", dest="version",
97 default=False, action="store_true", 92 default=False, action="store_true",
98 help="Show version and quit") 93 help="Show version and quit")
99 options, args = parser.parse_args() 94 options, args = parser.parse_args()
100 if args: 95 if args:
101 sys_exit("Expected options (e.g. --input example.maf), not arguments") 96 sys.exit("Expected options (e.g. --input example.maf), not arguments")
102 97
103 input_maf = options.input 98 input_maf = options.input
104 out_maf = options.maf 99 out_maf = options.maf
105 out_bam = options.bam 100 out_bam = options.bam
106 out_fasta = options.fasta 101 out_fasta = options.fasta
108 out_cstats = options.cstats 103 out_cstats = options.cstats
109 104
110 try: 105 try:
111 mira_path = os.environ["MIRA4"] 106 mira_path = os.environ["MIRA4"]
112 except KeyError: 107 except KeyError:
113 sys_exit("Environment variable $MIRA4 not set") 108 sys.exit("Environment variable $MIRA4 not set")
114 mira_convert = os.path.join(mira_path, "miraconvert") 109 mira_convert = os.path.join(mira_path, "miraconvert")
115 if not os.path.isfile(mira_convert): 110 if not os.path.isfile(mira_convert):
116 sys_exit("Missing miraconvert under $MIRA4, %r\nFolder contained: %s" 111 sys.exit("Missing miraconvert under $MIRA4, %r\nFolder contained: %s"
117 % (mira_convert, ", ".join(os.listdir(mira_path)))) 112 % (mira_convert, ", ".join(os.listdir(mira_path))))
118 113
119 mira_convert_ver = get_version(mira_convert) 114 mira_convert_ver = get_version(mira_convert)
120 if not mira_convert_ver.strip().startswith("4.0"): 115 if not mira_convert_ver.strip().startswith("4.0"):
121 sys_exit("This wrapper is for MIRA V4.0, not:\n%s\n%s" % (mira_convert_ver, mira_convert)) 116 sys.exit("This wrapper is for MIRA V4.0, not:\n%s\n%s" % (mira_convert_ver, mira_convert))
122 if options.version: 117 if options.version:
123 print("%s, MIRA wrapper version %s" % (mira_convert_ver, WRAPPER_VER)) 118 print("%s, MIRA wrapper version %s" % (mira_convert_ver, WRAPPER_VER))
124 sys.exit(0) 119 sys.exit(0)
125 120
126 if not input_maf: 121 if not input_maf:
127 sys_exit("Input MIRA file is required") 122 sys.exit("Input MIRA file is required")
128 elif not os.path.isfile(input_maf): 123 elif not os.path.isfile(input_maf):
129 sys_exit("Missing input MIRA file: %r" % input_maf) 124 sys.exit("Missing input MIRA file: %r" % input_maf)
130 125
131 if not (out_maf or out_bam or out_fasta or out_ace or out_cstats): 126 if not (out_maf or out_bam or out_fasta or out_ace or out_cstats):
132 sys_exit("No output requested") 127 sys.exit("No output requested")
133 128
134 129
135 def check_min_int(value, name): 130 def check_min_int(value, name):
136 try: 131 try:
137 i = int(value) 132 i = int(value)
138 except: 133 except ValueError:
139 sys_exit("Bad %s setting, %r" % (name, value)) 134 sys.exit("Bad %s setting, %r" % (name, value))
140 if i < 0: 135 if i < 0:
141 sys_exit("Negative %s setting, %r" % (name, value)) 136 sys.exit("Negative %s setting, %r" % (name, value))
142 return i 137 return i
143 138
144 min_length = check_min_int(options.min_length, "minimum length") 139 min_length = check_min_int(options.min_length, "minimum length")
145 min_cover = check_min_int(options.min_cover, "minimum cover") 140 min_cover = check_min_int(options.min_cover, "minimum cover")
146 min_reads = check_min_int(options.min_reads, "minimum reads") 141 min_reads = check_min_int(options.min_reads, "minimum reads")
174 cmd_list.append("cstats") 169 cmd_list.append("cstats")
175 run(cmd_list) 170 run(cmd_list)
176 171
177 def collect(old, new): 172 def collect(old, new):
178 if not os.path.isfile(old): 173 if not os.path.isfile(old):
179 sys_exit("Missing expected output file %s" % old) 174 sys.exit("Missing expected output file %s" % old)
180 shutil.move(old, new) 175 shutil.move(old, new)
181 176
182 if out_maf: 177 if out_maf:
183 collect(os.path.join(temp, "converted.maf"), out_maf) 178 collect(os.path.join(temp, "converted.maf"), out_maf)
184 if out_fasta: 179 if out_fasta:
188 collect(old, out_fasta) 183 collect(old, out_fasta)
189 else: 184 else:
190 #Might the output be filtered down to zero contigs? 185 #Might the output be filtered down to zero contigs?
191 old = os.path.join(temp, "converted.fasta") 186 old = os.path.join(temp, "converted.fasta")
192 if not os.path.isfile(old): 187 if not os.path.isfile(old):
193 sys_exit("Missing expected output FASTA file") 188 sys.exit("Missing expected output FASTA file")
194 elif os.path.getsize(old) == 0: 189 elif os.path.getsize(old) == 0:
195 print("Warning - no contigs (harsh filters?)") 190 print("Warning - no contigs (harsh filters?)")
196 collect(old, out_fasta) 191 collect(old, out_fasta)
197 else: 192 else:
198 sys_exit("Missing expected output FASTA file (only generic file present)") 193 sys.exit("Missing expected output FASTA file (only generic file present)")
199 if out_ace: 194 if out_ace:
200 collect(os.path.join(temp, "converted.maf"), out_ace) 195 collect(os.path.join(temp, "converted.maf"), out_ace)
201 if out_cstats: 196 if out_cstats:
202 collect(os.path.join(temp, "converted_info_contigstats.txt"), out_cstats) 197 collect(os.path.join(temp, "converted_info_contigstats.txt"), out_cstats)
203 198
205 assert os.path.isfile(out_fasta) 200 assert os.path.isfile(out_fasta)
206 old = os.path.join(temp, "converted.samnbb") 201 old = os.path.join(temp, "converted.samnbb")
207 if not os.path.isfile(old): 202 if not os.path.isfile(old):
208 old = os.path.join(temp, "converted.sam") 203 old = os.path.join(temp, "converted.sam")
209 if not os.path.isfile(old): 204 if not os.path.isfile(old):
210 sys_exit("Missing expected intermediate file %s" % old) 205 sys.exit("Missing expected intermediate file %s" % old)
211 h = BytesIO() 206 h = BytesIO()
212 msg = depad(out_fasta, old, out_bam, h) 207 msg = depad(out_fasta, old, out_bam, h)
213 if msg: 208 if msg:
214 print(msg) 209 print(msg)
215 print(h.getvalue()) 210 print(h.getvalue())