# HG changeset patch
# User greg
# Date 1457034767 18000
# Node ID ec35e8d25958babaa54714a6c46beb618f676b57
# Parent 24c055f480651e71902c11b30480c6268ab99fb0
Uploaded
diff -r 24c055f48065 -r ec35e8d25958 extract_genomic_dna.xml
--- a/extract_genomic_dna.xml Thu Mar 03 14:52:35 2016 -0500
+++ b/extract_genomic_dna.xml Thu Mar 03 14:52:47 2016 -0500
@@ -28,7 +28,10 @@
#end if
--output_format $output_format_cond.output_format
#if str($output_format_cond.output_format) == "fasta":
- --description_field_delimiter $output_format_cond.description_field_delimiter
+ --fasta_header_type $output_format_cond.fasta_header_type_cond.fasta_header_type
+ #if str($output_format_cond.fasta_header_type_cond.fasta_header_type) == "char_delimited":
+ --fasta_header_delimiter $output_format_cond.fasta_header_type_cond.fasta_header_delimiter
+ #end if
#end if
--output $output
]]>
@@ -69,13 +72,22 @@
-
-
-
-
-
-
-
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
@@ -93,7 +105,8 @@
-
+
+
@@ -101,7 +114,8 @@
-
+
+
@@ -124,7 +138,8 @@
-
+
+
@@ -134,7 +149,8 @@
-
+
+
@@ -143,7 +159,7 @@
-
+
@@ -170,14 +186,27 @@
**What it does**
This tool uses coordinate, strand, and build information to fetch genomic DNAs in FASTA or interval format.
-If the output format is FASTA, the character delimiter can be selected for the fields in the description.
-For example, selecting an underscore will produce a description like this:
+If the output format is FASTA, the header format can be specified.
+
+Selecting the **bedtools getfasta default** option produces a FASTA heder formatted like the default header
+produced the the bedtools getfasta tool, and the "force strandedness" option is assumed. If the input data
+includes a strand column and the strand is '+' or '-', it is included in the header. If the input data includes
+a strand column and the value of strand is anything but '+' or '-', a '.' is included in the header. If the
+input data does not include a strand column, a '.' is included in the header.
- >gi_31563518_ref_NP_852610.1
+An example FASTA header produced by selecting this option is:
+
+ >chr7:127475281-127475310(+)
+
+Selecing the **character delimited field values** option allows selection of a character delimiter that is used
+when generating the FASTA header with fields genome, chrom, start, end, strand (name) delimited by the
+selected character. For example, selecting an underscore will produce a FASTA header like this:
+
+ >mm9_53_550_+ test_chromosome
while selecting a vertical bar will produce a description like this:
- >gi|31563518|ref|NP_852610.1
+ >mm9|53|550|+ test_chromosome
If strand is not defined, the default value is "+".