Mercurial > repos > iuc > bedtools
comparison getfastaBed.xml @ 4:315929597efb draft
Uploaded
| author | iuc |
|---|---|
| date | Wed, 07 Jan 2015 12:45:05 -0500 |
| parents | 7511823bdea1 |
| children |
comparison
equal
deleted
inserted
replaced
| 3:190a747ddaa8 | 4:315929597efb |
|---|---|
| 4 <import>macros.xml</import> | 4 <import>macros.xml</import> |
| 5 </macros> | 5 </macros> |
| 6 <expand macro="requirements" /> | 6 <expand macro="requirements" /> |
| 7 <expand macro="stdio" /> | 7 <expand macro="stdio" /> |
| 8 <command> | 8 <command> |
| 9 <![CDATA[ | |
| 9 bedtools getfasta | 10 bedtools getfasta |
| 10 $name | 11 $name |
| 11 $tab | 12 $tab |
| 12 $strand | 13 $strand |
| 13 $split | 14 $split |
| 14 -fi $fasta | 15 -fi $fasta |
| 15 -bed $inputA | 16 -bed $input |
| 16 -fo $output | 17 -fo $output |
| 18 ]]> | |
| 17 </command> | 19 </command> |
| 18 <inputs> | 20 <inputs> |
| 19 <param format="bed,vcf,gff,gff3" name="inputA" type="data" label="BED/VCF/GFF file" /> | 21 <param format="bed,vcf,gff,gff3" name="input" type="data" label="BED/VCF/GFF file" /> |
| 20 <param format="fasta" name="fasta" type="data" label="Fasta file" /> | 22 <param format="fasta" name="fasta" type="data" label="Fasta file" /> |
| 21 <param name="name" type="boolean" checked="false" truevalue="-name" falsevalue="" label="Use the “name” column in the BED file for the FASTA headers in the output FASTA file" /> | 23 <param name="name" type="boolean" checked="false" truevalue="-name" falsevalue="" |
| 22 <param name="tab" type="boolean" checked="false" truevalue="-tab" falsevalue="" label="Report extract sequences in a tab-delimited format instead of in FASTA format" /> | 24 label="Use the 'name' column in the BED file for the FASTA headers in the output FASTA file" |
| 23 <param name="strand" type="boolean" checked="false" truevalue="-s" falsevalue="" label="Force strandedness" help="If the feature occupies the antisense strand, the sequence will be reverse complemented." /> | 25 help="(-name)" /> |
| 24 <param name="split" type="boolean" checked="false" truevalue="-split" falsevalue="" label="Given BED12 input, extract and concatenate the sequences from the BED 'blocks' (e.g., exons)" /> | 26 <param name="tab" type="boolean" checked="false" truevalue="-tab" falsevalue="" |
| 27 label="Report extract sequences in a tab-delimited format instead of in FASTA format" | |
| 28 help="(-tab)" /> | |
| 29 <param name="strand" type="boolean" checked="false" truevalue="-s" falsevalue="" | |
| 30 label="Force strandedness" | |
| 31 help="If the feature occupies the antisense strand, the sequence will be reverse complemented. (-s)" /> | |
| 32 <expand macro="split" /> | |
| 25 </inputs> | 33 </inputs> |
| 26 <outputs> | 34 <outputs> |
| 27 <data format="fasta" name="output" /> | 35 <data format="fasta" name="output"> |
| 36 <change_format> | |
| 37 <when input="tab" value="-tab" format="tabular" /> | |
| 38 </change_format> | |
| 39 </data> | |
| 28 </outputs> | 40 </outputs> |
| 41 <tests> | |
| 42 <test> | |
| 43 <param name="input" value="nucBed1.bed" ftype="bed" /> | |
| 44 <param name="fasta" value="nucBed1.fasta" ftype="fasta" /> | |
| 45 <param name="tab" value="False" /> | |
| 46 <param name="split" value="False" /> | |
| 47 <output name="output" file="getfastaBed_result1.bed" ftype="fasta" /> | |
| 48 </test> | |
| 49 <test> | |
| 50 <param name="input" value="nucBed1.bed" ftype="bed" /> | |
| 51 <param name="fasta" value="nucBed1.fasta" ftype="fasta" /> | |
| 52 <param name="tab" value="True" /> | |
| 53 <param name="split" value="False" /> | |
| 54 <output name="output" file="getfastaBed_result2.tabular" ftype="tabular" /> | |
| 55 </test> | |
| 56 </tests> | |
| 29 <help> | 57 <help> |
| 58 <![CDATA[ | |
| 30 **What it does** | 59 **What it does** |
| 31 | 60 |
| 32 bedtools getfasta will extract the sequence defined by the coordinates in a BED interval and create a new FASTA entry in the output file for each extracted sequence. By default, the FASTA header for each extracted sequence will be formatted as follows: “<chrom>:<start>-<end>”. | 61 bedtools getfasta will extract the sequence defined by the coordinates in a BED interval and create a new FASTA entry in the output file for each extracted sequence. By default, the FASTA header for each extracted sequence will be formatted as follows: “>chrom>:<start>-<end>”. |
| 33 | 62 |
| 34 .. image:: $PATH_TO_IMAGES/getfasta-glyph.png | 63 .. image:: $PATH_TO_IMAGES/getfasta-glyph.png |
| 35 | 64 |
| 36 .. class:: warningmark | 65 .. class:: warningmark |
| 37 | 66 |
| 38 1. The headers in the input FASTA file must exactly match the chromosome column in the BED file. | 67 1. The headers in the input FASTA file must exactly match the chromosome column in the BED file. |
| 39 | 68 |
| 40 2. You can use the UNIX fold command to set the line width of the FASTA output. For example, fold -w 60 will make each line of the FASTA file have at most 60 nucleotides for easy viewing. | 69 2. You can use the UNIX fold command to set the line width of the FASTA output. For example, fold -w 60 will make each line of the FASTA file have at most 60 nucleotides for easy viewing. |
| 41 | 70 |
| 42 @REFERENCES@ | 71 @REFERENCES@ |
| 72 ]]> | |
| 43 </help> | 73 </help> |
| 44 <expand macro="citations" /> | 74 <expand macro="citations" /> |
| 45 </tool> | 75 </tool> |
