annotate bamFingerprint.xml @ 6:5742b322f956 draft default tip

Uploaded
author greg
date Tue, 10 Dec 2013 10:09:39 -0500
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
6
5742b322f956 Uploaded
greg
parents:
diff changeset
1 <tool id="deeptools_bamFingerprint" name="bamFingerprint" version="1.0">
5742b322f956 Uploaded
greg
parents:
diff changeset
2 <description>plots profiles of BAM files; useful for assessing ChIP signal strength</description>
5742b322f956 Uploaded
greg
parents:
diff changeset
3 <expand macro="requirements" />
5742b322f956 Uploaded
greg
parents:
diff changeset
4 <macros>
5742b322f956 Uploaded
greg
parents:
diff changeset
5 <import>deepTools_macros.xml</import>
5742b322f956 Uploaded
greg
parents:
diff changeset
6 </macros>
5742b322f956 Uploaded
greg
parents:
diff changeset
7 <command>
5742b322f956 Uploaded
greg
parents:
diff changeset
8 #import tempfile
5742b322f956 Uploaded
greg
parents:
diff changeset
9 #set $temp_dir = os.path.abspath(tempfile.mkdtemp())
5742b322f956 Uploaded
greg
parents:
diff changeset
10
5742b322f956 Uploaded
greg
parents:
diff changeset
11 #set files=[]
5742b322f956 Uploaded
greg
parents:
diff changeset
12 #set labels=[]
5742b322f956 Uploaded
greg
parents:
diff changeset
13
5742b322f956 Uploaded
greg
parents:
diff changeset
14 @multiple_input_bams@
5742b322f956 Uploaded
greg
parents:
diff changeset
15
5742b322f956 Uploaded
greg
parents:
diff changeset
16 bamFingerprint
5742b322f956 Uploaded
greg
parents:
diff changeset
17
5742b322f956 Uploaded
greg
parents:
diff changeset
18 @THREADS@
5742b322f956 Uploaded
greg
parents:
diff changeset
19
5742b322f956 Uploaded
greg
parents:
diff changeset
20 --bamfiles #echo " ".join($files)
5742b322f956 Uploaded
greg
parents:
diff changeset
21 --labels #echo " ".join($labels)
5742b322f956 Uploaded
greg
parents:
diff changeset
22
5742b322f956 Uploaded
greg
parents:
diff changeset
23 --fragmentLength $fragmentLength
5742b322f956 Uploaded
greg
parents:
diff changeset
24
5742b322f956 Uploaded
greg
parents:
diff changeset
25 #set newoutFileName=str($outFileName)+".png"
5742b322f956 Uploaded
greg
parents:
diff changeset
26 --plotFile $newoutFileName
5742b322f956 Uploaded
greg
parents:
diff changeset
27
5742b322f956 Uploaded
greg
parents:
diff changeset
28 #if $outputOpt.showOutputOpt == "yes"
5742b322f956 Uploaded
greg
parents:
diff changeset
29 #if $outputOpt.saveRawCounts:
5742b322f956 Uploaded
greg
parents:
diff changeset
30 --outRawCounts '$outFileRawCounts'
5742b322f956 Uploaded
greg
parents:
diff changeset
31 #end if
5742b322f956 Uploaded
greg
parents:
diff changeset
32 #end if
5742b322f956 Uploaded
greg
parents:
diff changeset
33
5742b322f956 Uploaded
greg
parents:
diff changeset
34 #if $advancedOpt.showAdvancedOpt == "yes":
5742b322f956 Uploaded
greg
parents:
diff changeset
35
5742b322f956 Uploaded
greg
parents:
diff changeset
36 #if str($advancedOpt.region.value) != '':
5742b322f956 Uploaded
greg
parents:
diff changeset
37 --region '$advancedOpt.region'
5742b322f956 Uploaded
greg
parents:
diff changeset
38 #end if
5742b322f956 Uploaded
greg
parents:
diff changeset
39
5742b322f956 Uploaded
greg
parents:
diff changeset
40 --binSize '$advancedOpt.binSize'
5742b322f956 Uploaded
greg
parents:
diff changeset
41 --numberOfSamples '$advancedOpt.numberOfSamples'
5742b322f956 Uploaded
greg
parents:
diff changeset
42
5742b322f956 Uploaded
greg
parents:
diff changeset
43 $advancedOpt.doNotExtendPairedEnds
5742b322f956 Uploaded
greg
parents:
diff changeset
44 $advancedOpt.ignoreDuplicates
5742b322f956 Uploaded
greg
parents:
diff changeset
45 $advancedOpt.skipZeros
5742b322f956 Uploaded
greg
parents:
diff changeset
46
5742b322f956 Uploaded
greg
parents:
diff changeset
47 #if $advancedOpt.minMappingQuality:
5742b322f956 Uploaded
greg
parents:
diff changeset
48 --minMappingQuality '$advancedOpt.minMappingQuality'
5742b322f956 Uploaded
greg
parents:
diff changeset
49 #end if
5742b322f956 Uploaded
greg
parents:
diff changeset
50 #end if
5742b322f956 Uploaded
greg
parents:
diff changeset
51 ; mv $newoutFileName $outFileName
5742b322f956 Uploaded
greg
parents:
diff changeset
52 ; rm $temp_dir -rf
5742b322f956 Uploaded
greg
parents:
diff changeset
53 </command>
5742b322f956 Uploaded
greg
parents:
diff changeset
54
5742b322f956 Uploaded
greg
parents:
diff changeset
55 <inputs>
5742b322f956 Uploaded
greg
parents:
diff changeset
56 <expand macro="multiple_input_bams" />
5742b322f956 Uploaded
greg
parents:
diff changeset
57
5742b322f956 Uploaded
greg
parents:
diff changeset
58 <param name="fragmentLength" type="integer" value="200" min="1"
5742b322f956 Uploaded
greg
parents:
diff changeset
59 label="Length of the average fragment size"/>
5742b322f956 Uploaded
greg
parents:
diff changeset
60 <conditional name="advancedOpt">
5742b322f956 Uploaded
greg
parents:
diff changeset
61 <param name="showAdvancedOpt" type="select" label="Show advanced options" >
5742b322f956 Uploaded
greg
parents:
diff changeset
62 <option value="no" selected="true">no</option>
5742b322f956 Uploaded
greg
parents:
diff changeset
63 <option value="yes">yes</option>
5742b322f956 Uploaded
greg
parents:
diff changeset
64 </param>
5742b322f956 Uploaded
greg
parents:
diff changeset
65 <when value="no" />
5742b322f956 Uploaded
greg
parents:
diff changeset
66 <when value="yes">
5742b322f956 Uploaded
greg
parents:
diff changeset
67 <param name="region" type="text" value=""
5742b322f956 Uploaded
greg
parents:
diff changeset
68 label="Region of the genome to limit the operation to"
5742b322f956 Uploaded
greg
parents:
diff changeset
69 help="This is useful when testing parameters to reduce the computing time. The format is chr:start:end, for example &quot;chr10&quot; or &quot;chr10:456700:891000&quot;" />
5742b322f956 Uploaded
greg
parents:
diff changeset
70
5742b322f956 Uploaded
greg
parents:
diff changeset
71 <param name="binSize" type="integer" value="10000" min="1"
5742b322f956 Uploaded
greg
parents:
diff changeset
72 label="Bin size in bp"
5742b322f956 Uploaded
greg
parents:
diff changeset
73 help="Length in base pairs for a window used to sample the genome."/>
5742b322f956 Uploaded
greg
parents:
diff changeset
74
5742b322f956 Uploaded
greg
parents:
diff changeset
75 <param name="numberOfSamples" type="integer" value="100000" min="1"
5742b322f956 Uploaded
greg
parents:
diff changeset
76 label="Number of samples"
5742b322f956 Uploaded
greg
parents:
diff changeset
77 help="Number of bins sampled from the genome, for which the overlapping reads are counted"/>
5742b322f956 Uploaded
greg
parents:
diff changeset
78
5742b322f956 Uploaded
greg
parents:
diff changeset
79 <param name="doNotExtendPairedEnds" type="boolean" truevalue="--doNotExtendPairedEnds" falsevalue=""
5742b322f956 Uploaded
greg
parents:
diff changeset
80 label="Do not extend paired ends"
5742b322f956 Uploaded
greg
parents:
diff changeset
81 help="If set, reads are not extended to match the fragment length reported in the BAM file; instead they will be extended to match the fragment length given in the &quot;Length of the average fragment size&quot; option. Default is to extend the reads if paired end information is available."/>
5742b322f956 Uploaded
greg
parents:
diff changeset
82
5742b322f956 Uploaded
greg
parents:
diff changeset
83 <param name="ignoreDuplicates" type="boolean" truevalue="--ignoreDuplicates" falsevalue=""
5742b322f956 Uploaded
greg
parents:
diff changeset
84 label="Ignore duplicates"
5742b322f956 Uploaded
greg
parents:
diff changeset
85 help="If set, reads that have the same orientation and start position will be considered only once. If reads are paired, the mate position also has to coincide to ignore a read." />
5742b322f956 Uploaded
greg
parents:
diff changeset
86
5742b322f956 Uploaded
greg
parents:
diff changeset
87 <param name="minMappingQuality" type="integer" optional="true" value="1" min="1"
5742b322f956 Uploaded
greg
parents:
diff changeset
88 label="Minimum mapping quality"
5742b322f956 Uploaded
greg
parents:
diff changeset
89 help= "If set, only reads that have a mapping quality score higher than the given value are considered. *Note* Bowtie's mapping quality is related to uniqueness: the higher the score, the more unique a read is. A mapping quality defined by Bowtie of 10 or less indicates that there is at least a 1 in 10 chance that the read truly originated elsewhere."/>
5742b322f956 Uploaded
greg
parents:
diff changeset
90
5742b322f956 Uploaded
greg
parents:
diff changeset
91 <param name="skipZeros" type="boolean" truevalue="--skipZeros" falsevalue=""
5742b322f956 Uploaded
greg
parents:
diff changeset
92 label ="Skip zeros"
5742b322f956 Uploaded
greg
parents:
diff changeset
93 help ="If set, then zero counts that happen for *all* BAM files given are ignored. This might have the effect that fewer regions are considered than indicated in the option where the number of samples is defined." />
5742b322f956 Uploaded
greg
parents:
diff changeset
94 </when>
5742b322f956 Uploaded
greg
parents:
diff changeset
95 </conditional>
5742b322f956 Uploaded
greg
parents:
diff changeset
96
5742b322f956 Uploaded
greg
parents:
diff changeset
97 <conditional name="outputOpt">
5742b322f956 Uploaded
greg
parents:
diff changeset
98 <param name="showOutputOpt" type="select" label="Show additional output options" >
5742b322f956 Uploaded
greg
parents:
diff changeset
99 <option value="no" selected="true">no</option>
5742b322f956 Uploaded
greg
parents:
diff changeset
100 <option value="yes">yes</option>
5742b322f956 Uploaded
greg
parents:
diff changeset
101 </param>
5742b322f956 Uploaded
greg
parents:
diff changeset
102 <when value="no" />
5742b322f956 Uploaded
greg
parents:
diff changeset
103 <when value="yes">
5742b322f956 Uploaded
greg
parents:
diff changeset
104 <param name="saveRawCounts" type="boolean" label="Save the bin counts"/>
5742b322f956 Uploaded
greg
parents:
diff changeset
105 </when>
5742b322f956 Uploaded
greg
parents:
diff changeset
106 </conditional>
5742b322f956 Uploaded
greg
parents:
diff changeset
107
5742b322f956 Uploaded
greg
parents:
diff changeset
108 </inputs>
5742b322f956 Uploaded
greg
parents:
diff changeset
109 <outputs>
5742b322f956 Uploaded
greg
parents:
diff changeset
110 <data format="png" name="outFileName" />
5742b322f956 Uploaded
greg
parents:
diff changeset
111 <data format="tabular" name="outFileRawCounts" label="${tool.name} on ${on_string}: bin counts">
5742b322f956 Uploaded
greg
parents:
diff changeset
112 <filter>(outputOpt['showOutputOpt'] == 'yes' and outputOpt['saveRawCounts'] == True)</filter>
5742b322f956 Uploaded
greg
parents:
diff changeset
113 </data>
5742b322f956 Uploaded
greg
parents:
diff changeset
114 </outputs>
5742b322f956 Uploaded
greg
parents:
diff changeset
115 <help>
5742b322f956 Uploaded
greg
parents:
diff changeset
116
5742b322f956 Uploaded
greg
parents:
diff changeset
117 **What it does**
5742b322f956 Uploaded
greg
parents:
diff changeset
118
5742b322f956 Uploaded
greg
parents:
diff changeset
119 This tool is based on a method developed by Diaz et al. (2012). Stat Appl Genet Mol Biol 11(3).
5742b322f956 Uploaded
greg
parents:
diff changeset
120 The resulting plot can be used to assess the strength of a ChIP (for factors that bind to narrow regions).
5742b322f956 Uploaded
greg
parents:
diff changeset
121 The tool first samples indexed BAM files and counts all reads overlapping a window (bin) of specified length.
5742b322f956 Uploaded
greg
parents:
diff changeset
122 These counts are then sorted according to their rank and the cumulative sum of read counts is plotted. An ideal input
5742b322f956 Uploaded
greg
parents:
diff changeset
123 with perfect uniform distribution of reads along the genome (i.e. without enrichments in open chromatin etc.) should
5742b322f956 Uploaded
greg
parents:
diff changeset
124 generate a straight diagonal line. A very specific and strong ChIP enrichment will be indicated by a prominent and steep
5742b322f956 Uploaded
greg
parents:
diff changeset
125 rise of the cumulative sum towards the highest rank. This means that a big chunk of reads from the ChIP sample is located in
5742b322f956 Uploaded
greg
parents:
diff changeset
126 few bins, which corresponds to the high, narrow enrichments seen for transcription factors.
5742b322f956 Uploaded
greg
parents:
diff changeset
127
5742b322f956 Uploaded
greg
parents:
diff changeset
128
5742b322f956 Uploaded
greg
parents:
diff changeset
129 .. image:: $PATH_TO_IMAGES/QC_fingerprint.png
5742b322f956 Uploaded
greg
parents:
diff changeset
130
5742b322f956 Uploaded
greg
parents:
diff changeset
131
5742b322f956 Uploaded
greg
parents:
diff changeset
132 **Output files**:
5742b322f956 Uploaded
greg
parents:
diff changeset
133
5742b322f956 Uploaded
greg
parents:
diff changeset
134 - Diagnostic plot
5742b322f956 Uploaded
greg
parents:
diff changeset
135 - Data matrix of raw counts
5742b322f956 Uploaded
greg
parents:
diff changeset
136
5742b322f956 Uploaded
greg
parents:
diff changeset
137 -----
5742b322f956 Uploaded
greg
parents:
diff changeset
138
5742b322f956 Uploaded
greg
parents:
diff changeset
139 .. class:: infomark
5742b322f956 Uploaded
greg
parents:
diff changeset
140
5742b322f956 Uploaded
greg
parents:
diff changeset
141 @REFERENCES@
5742b322f956 Uploaded
greg
parents:
diff changeset
142
5742b322f956 Uploaded
greg
parents:
diff changeset
143 </help>
5742b322f956 Uploaded
greg
parents:
diff changeset
144 </tool>