Galaxy |

Changeset 0:6b5153d02ac2 (2014-11-01)

Next changeset 1:a5ef7a9e5cb7 (2014-11-04)

Commit message:
Uploaded

added:
README.txt
genbanktofasta.py
genbanktofasta.xml
repository_dependencies.xml

diff -r 000000000000 -r 6b5153d02ac2 README.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/README.txt Sat Nov 01 10:34:38 2014 -0400

@@ -0,0 +1,15 @@
+
+----------------
+GenBank to FASTA
+----------------
+
+This package contains the GenBank to FASTA converter.
+
+--------------------------------------------------------------------
+Instructions for integration of the "GenBank to FASTA" tool into the workflow-system
+Galaxy (http://getgalaxy.org)
+--------------------------------------------------------------------
+
+For best results, we recommend that you install it via the toolshed.
+
+

diff -r 000000000000 -r 6b5153d02ac2 genbanktofasta.py
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/genbanktofasta.py Sat Nov 01 10:34:38 2014 -0400

[

@@ -0,0 +1,40 @@
+#!/usr/bin/env python
+"""
+Input: genbank file
+Output: fasta nucleotide or protein sequences
+This bit of code will record the full DNA nucleotide sequence for each record in the GenBank file as a fasta record.
+http://www.warwick.ac.uk/go/peter_cock/python/genbank2fasta/
+"""
+
+import sys, os
+from Bio import SeqIO
+
+
+def __main__():
+    """Command-line entry point: convert a GenBank file to FASTA.
+
+    Reads the input path from ``sys.argv[1]`` and the output path from
+    ``sys.argv[2]``, then passes both open files to ``gbk_to_fna``.
+    Exits with a usage message on stderr when either path is missing.
+    """
+    if len(sys.argv) < 3:
+        sys.exit("Usage: genbanktofasta.py <input.genbank> <output.fasta>")
+    infile = sys.argv[1]
+    outfile = sys.argv[2]
+    # The ``with`` blocks guarantee both files are closed even when opening
+    # the output fails or the conversion raises; closing a file that
+    # ``gbk_to_fna`` has already closed is a harmless no-op.
+    with open(infile, "r") as input_handle:
+        with open(outfile, "w") as output_handle:
+            gbk_to_fna(input_handle, output_handle)
+
+
+#Short version:
+#SeqIO.write(SeqIO.parse(input_handle, "genbank"), output_handle, "fasta")
+#Long version, allows full control of fasta output
+
+def gbk_to_fna(input_handle, output_handle):
+    """Write every record of a GenBank file as a FASTA entry.
+
+    Each record becomes a ``>id description`` header line followed by the
+    record's full sequence on a single line. Progress messages are printed
+    to stdout.
+
+    input_handle  -- open, readable file containing GenBank records
+    output_handle -- open, writable file that receives the FASTA text
+
+    Both handles are closed before returning, including when parsing or
+    writing raises.
+    """
+    try:
+        for seq_record in SeqIO.parse(input_handle, "genbank"):
+            # Single-argument print(...) behaves the same on Python 2 and 3.
+            print("Dealing with GenBank record %s" % seq_record.id)
+            # str(seq) replaces Seq.tostring(), which newer Biopython
+            # releases no longer provide.
+            output_handle.write(">%s %s\n%s\n" % (
+                seq_record.id,
+                seq_record.description,
+                str(seq_record.seq)))
+    finally:
+        output_handle.close()
+        input_handle.close()
+    print("Done")
+
+
+
+# Run the converter only when executed as a script, not when imported.
+if __name__ == "__main__":
+    __main__()
+

diff -r 000000000000 -r 6b5153d02ac2 genbanktofasta.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/genbanktofasta.xml Sat Nov 01 10:34:38 2014 -0400

[

@@ -0,0 +1,50 @@
+<tool id="genbank_to_fa" name="Converting GenBank files" version="1.0.0">
+
+    
+    <description>to Fasta format</description>
+
+    
+    <requirements>
+     <requirement type="binary">python</requirement>
+    </requirements>
+
+    <command interpreter="python">
+        genbanktofasta.py $input $output
+    </command>
+
+    
+    <inputs>
+        <param name="input" type="data" format="genbank" label="Your Genbank input file" help="" />
+    </inputs>
+
+    
+    <outputs>
+        <data name="output" format="fasta" label="${input.name}.fasta" /> 
+    </outputs>
+
+    
+    <stdio>
+        
+        <exit_code range="1:" level="fatal" />
+    </stdio>
+
+
+    
+    <help>
+
+
+================
+GenBank to Fasta
+================
+
+-----------
+Description
+-----------
+
+ | This tool converts a GenBank file to FASTA nucleotide format.
+ | Reference: http://www.warwick.ac.uk/go/peter_cock/python/genbank2fasta/
+
+
+    </help>
+
+</tool>

diff -r 000000000000 -r 6b5153d02ac2 repository_dependencies.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/repository_dependencies.xml Sat Nov 01 10:34:38 2014 -0400

@@ -0,0 +1,4 @@
+<?xml version="1.0"?>
+<repositories description="GenBank to FASTA tool requires the Galaxy applicable data format GenBank">
+ <repository changeset_revision="a4a890259b82" name="genbank_complete_datatype" owner="mons" toolshed="https://testtoolshed.g2.bx.psu.edu" />
+</repositories>