annotate gene_family_integrator.py @ 6:1d178e90fbe6 draft

Uploaded
author greg
date Mon, 10 Apr 2017 11:30:34 -0400
parents d06e3ae4eb5a
children 0bf47f620170
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
109a0eb7791f Uploaded
greg
parents:
diff changeset
#!/usr/bin/env python
"""Command-line wrapper around the external ``GeneFamilyIntegrator`` program.

Parses the wrapper's options, runs ``GeneFamilyIntegrator`` with the
corresponding flags, hands the exit status and captured stderr to
``utils.check_execution_errors``, then moves the files found under
``OUTPUT_DIR/orthogroups_fasta`` into ``--output_dir`` and writes an HTML
summary to ``--output``.
"""
import argparse
import os
import subprocess
import tempfile

import utils

# Directory (relative to the working directory) joined with
# 'orthogroups_fasta' below to locate the results to move.
OUTPUT_DIR = 'integratedGeneFamilies_dir'

parser = argparse.ArgumentParser()
parser.add_argument('--orthogroup_faa', dest='orthogroup_faa', help="Directory of input fasta datasets")
parser.add_argument('--scaffold', dest='scaffold', help='Orthogroups or gene families proteins scaffold')
parser.add_argument('--method', dest='method', help='Protein clustering method')
parser.add_argument('--orthogroup_fna', dest='orthogroup_fna', default=None, help='Use corresponding coding sequences')
parser.add_argument('--output', dest='output', help="Output dataset")
parser.add_argument('--output_dir', dest='output_dir', help="Output dataset file_path directory")

args = parser.parse_args()

# Build the command line as an argument vector rather than a shell string so
# that values containing spaces or shell metacharacters reach the program
# unchanged and are never interpreted by a shell.
cmd = [
    'GeneFamilyIntegrator',
    '--orthogroup_faa', str(args.orthogroup_faa),
    '--scaffold', str(args.scaffold),
    '--method', str(args.method),
]
if args.orthogroup_fna is not None:
    # Forwarded as a bare switch: only the presence of the option matters
    # here, its value is not passed on.
    cmd.append('--orthogroup_fna')

# Run the command.
# stdout was never consumed by this script, so it is discarded; stderr is
# spooled to a temporary file.  Waiting on a child whose output goes to
# undrained pipes can block forever once a pipe buffer fills up.
with open(os.devnull, 'w') as devnull, tempfile.TemporaryFile() as stderr_fh:
    proc = subprocess.Popen(args=cmd, stderr=stderr_fh, stdout=devnull)
    rc = proc.wait()
    # Rewind so the error checker reads the captured output from the start.
    # NOTE(review): assumes utils.check_execution_errors only reads from the
    # file object it is given -- confirm against utils.
    stderr_fh.seek(0)
    utils.check_execution_errors(rc, stderr_fh)

utils.move_directory_files(os.path.join(OUTPUT_DIR, 'orthogroups_fasta'), args.output_dir)
utils.write_html_output(args.output, 'Integrated gene family sequences', args.output_dir)