annotate bamCorrelate.xml @ 6:5742b322f956 draft default tip

Uploaded
author greg
date Tue, 10 Dec 2013 10:09:39 -0500
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
6
5742b322f956 Uploaded
greg
parents:
diff changeset
1 <tool id="deeptools_bamCorrelate" name="bamCorrelate" version="1.0.1">
5742b322f956 Uploaded
greg
parents:
diff changeset
2 <description>correlates pairs of BAM files</description>
5742b322f956 Uploaded
greg
parents:
diff changeset
3 <expand macro="requirements" />
5742b322f956 Uploaded
greg
parents:
diff changeset
4 <macros>
5742b322f956 Uploaded
greg
parents:
diff changeset
5 <import>deepTools_macros.xml</import>
5742b322f956 Uploaded
greg
parents:
diff changeset
6 </macros>
5742b322f956 Uploaded
greg
parents:
diff changeset
7 <command>
5742b322f956 Uploaded
greg
parents:
diff changeset
8 #import tempfile
5742b322f956 Uploaded
greg
parents:
diff changeset
9 #set $temp_dir = os.path.abspath(tempfile.mkdtemp())
5742b322f956 Uploaded
greg
parents:
diff changeset
10
5742b322f956 Uploaded
greg
parents:
diff changeset
11 #set files=[]
5742b322f956 Uploaded
greg
parents:
diff changeset
12 #set labels=[]
5742b322f956 Uploaded
greg
parents:
diff changeset
13
5742b322f956 Uploaded
greg
parents:
diff changeset
14 @multiple_input_bams@
5742b322f956 Uploaded
greg
parents:
diff changeset
15
5742b322f956 Uploaded
greg
parents:
diff changeset
16 bamCorrelate
5742b322f956 Uploaded
greg
parents:
diff changeset
17
5742b322f956 Uploaded
greg
parents:
diff changeset
18 $mode.modeOpt
5742b322f956 Uploaded
greg
parents:
diff changeset
19
5742b322f956 Uploaded
greg
parents:
diff changeset
20 @THREADS@
5742b322f956 Uploaded
greg
parents:
diff changeset
21
5742b322f956 Uploaded
greg
parents:
diff changeset
22 --bamfiles #echo " ".join($files)
5742b322f956 Uploaded
greg
parents:
diff changeset
23 --labels #echo " ".join($labels)
5742b322f956 Uploaded
greg
parents:
diff changeset
24
5742b322f956 Uploaded
greg
parents:
diff changeset
25 --fragmentLength $fragmentLength
5742b322f956 Uploaded
greg
parents:
diff changeset
26 --corMethod $corMethod
5742b322f956 Uploaded
greg
parents:
diff changeset
27
5742b322f956 Uploaded
greg
parents:
diff changeset
28 #set newoutFileName=str($outFileName)+".png"
5742b322f956 Uploaded
greg
parents:
diff changeset
29 --plotFile $newoutFileName
5742b322f956 Uploaded
greg
parents:
diff changeset
30 ## Each optional output path is passed only when its checkbox is set, mirroring the filter conditions on outFileRawCounts / outFileCorMatrix in the outputs section.
5742b322f956 Uploaded
greg
parents:
diff changeset
31 #if $outputOpt.showOutputOpt == "yes"
5742b322f956 Uploaded
greg
parents:
diff changeset
32 #if $outputOpt.saveRawCounts# --outRawCounts '$outFileRawCounts' #end if#
5742b322f956 Uploaded
greg
parents:
diff changeset
33 #if $outputOpt.saveCorMatrix# --outFileCorMatrix '$outFileCorMatrix' #end if#
5742b322f956 Uploaded
greg
parents:
diff changeset
34 #end if
5742b322f956 Uploaded
greg
parents:
diff changeset
35
5742b322f956 Uploaded
greg
parents:
diff changeset
36 #if $mode.modeOpt == "bins":
5742b322f956 Uploaded
greg
parents:
diff changeset
37 --binSize '$mode.binSize'
5742b322f956 Uploaded
greg
parents:
diff changeset
38 --numberOfSamples '$mode.numberOfSamples'
5742b322f956 Uploaded
greg
parents:
diff changeset
39 #else:
5742b322f956 Uploaded
greg
parents:
diff changeset
40 --BED $mode.region_file
5742b322f956 Uploaded
greg
parents:
diff changeset
41 #end if
5742b322f956 Uploaded
greg
parents:
diff changeset
42
5742b322f956 Uploaded
greg
parents:
diff changeset
43 ## options available in both modes
5742b322f956 Uploaded
greg
parents:
diff changeset
44 #if $mode.advancedOpt.showAdvancedOpt == "yes":
5742b322f956 Uploaded
greg
parents:
diff changeset
45
5742b322f956 Uploaded
greg
parents:
diff changeset
46 #if str($mode.advancedOpt.region.value) != '':
5742b322f956 Uploaded
greg
parents:
diff changeset
47 --region '$mode.advancedOpt.region'
5742b322f956 Uploaded
greg
parents:
diff changeset
48 #end if
5742b322f956 Uploaded
greg
parents:
diff changeset
49
5742b322f956 Uploaded
greg
parents:
diff changeset
50 $mode.advancedOpt.doNotExtendPairedEnds
5742b322f956 Uploaded
greg
parents:
diff changeset
51 $mode.advancedOpt.ignoreDuplicates
5742b322f956 Uploaded
greg
parents:
diff changeset
52 $mode.advancedOpt.includeZeros
5742b322f956 Uploaded
greg
parents:
diff changeset
53
5742b322f956 Uploaded
greg
parents:
diff changeset
54 #if $mode.advancedOpt.minMappingQuality:
5742b322f956 Uploaded
greg
parents:
diff changeset
55 --minMappingQuality '$mode.advancedOpt.minMappingQuality'
5742b322f956 Uploaded
greg
parents:
diff changeset
56 #end if
5742b322f956 Uploaded
greg
parents:
diff changeset
57
5742b322f956 Uploaded
greg
parents:
diff changeset
58 #if $mode.advancedOpt.zMin:
5742b322f956 Uploaded
greg
parents:
diff changeset
59 --zMin $mode.advancedOpt.zMin
5742b322f956 Uploaded
greg
parents:
diff changeset
60 #end if
5742b322f956 Uploaded
greg
parents:
diff changeset
61 #if $mode.advancedOpt.zMax:
5742b322f956 Uploaded
greg
parents:
diff changeset
62 --zMax $mode.advancedOpt.zMax
5742b322f956 Uploaded
greg
parents:
diff changeset
63 #end if
5742b322f956 Uploaded
greg
parents:
diff changeset
64 --colorMap '$mode.advancedOpt.colorMap'
5742b322f956 Uploaded
greg
parents:
diff changeset
65
5742b322f956 Uploaded
greg
parents:
diff changeset
66 #end if
5742b322f956 Uploaded
greg
parents:
diff changeset
67 ## The plot was written to the output path plus a ".png" suffix (see newoutFileName); move it to the real output path, then remove the temporary directory. Options precede the operand so the rm call also works with non-GNU rm.
5742b322f956 Uploaded
greg
parents:
diff changeset
68 ; mv $newoutFileName $outFileName
5742b322f956 Uploaded
greg
parents:
diff changeset
69 ; rm -rf $temp_dir
5742b322f956 Uploaded
greg
parents:
diff changeset
70 </command>
5742b322f956 Uploaded
greg
parents:
diff changeset
71
5742b322f956 Uploaded
greg
parents:
diff changeset
72 <inputs>
5742b322f956 Uploaded
greg
parents:
diff changeset
73 <expand macro="multiple_input_bams" />
5742b322f956 Uploaded
greg
parents:
diff changeset
74
5742b322f956 Uploaded
greg
parents:
diff changeset
75 <param name="fragmentLength" type="integer" value="300" min="1"
5742b322f956 Uploaded
greg
parents:
diff changeset
76 label="Length of the average fragment size"
5742b322f956 Uploaded
greg
parents:
diff changeset
77 help ="Reads will be extended to match this length unless they are paired-end, in which case they will be extended to match the fragment length. *NOTE*: If the BAM files contain mated and unmated paired-end reads, unmated reads will be extended to match the fragment length."/>
5742b322f956 Uploaded
greg
parents:
diff changeset
78
5742b322f956 Uploaded
greg
parents:
diff changeset
79 <param name="corMethod" type="select" label="Correlation method">
5742b322f956 Uploaded
greg
parents:
diff changeset
80 <option value="pearson">Pearson</option>
5742b322f956 Uploaded
greg
parents:
diff changeset
81 <option value="spearman">Spearman</option>
5742b322f956 Uploaded
greg
parents:
diff changeset
82 </param>
5742b322f956 Uploaded
greg
parents:
diff changeset
83
5742b322f956 Uploaded
greg
parents:
diff changeset
84 <conditional name="mode">
5742b322f956 Uploaded
greg
parents:
diff changeset
85 <param name="modeOpt" type="select" label="Choose computation mode"
5742b322f956 Uploaded
greg
parents:
diff changeset
86 help="In the bins mode, the correlation is computed based on equal length bins. In the BED file mode, a list of genomic regions in BED format has to be given. For each region in the BED file the number of overlapping reads is counted in each of the BAM files. Then the correlation is computed.">
5742b322f956 Uploaded
greg
parents:
diff changeset
87 <option value="bins" selected="true">Bins</option>
5742b322f956 Uploaded
greg
parents:
diff changeset
88 <option value="BED-file">Limit correlation to certain regions (BED file)</option>
5742b322f956 Uploaded
greg
parents:
diff changeset
89 </param>
5742b322f956 Uploaded
greg
parents:
diff changeset
90 <when value="bins">
5742b322f956 Uploaded
greg
parents:
diff changeset
91 <param name="binSize" type="integer" value="10000" min="1"
5742b322f956 Uploaded
greg
parents:
diff changeset
92 label="Bin size in bp"
5742b322f956 Uploaded
greg
parents:
diff changeset
93 help="Length in base pairs for a window used to sample the genome."/>
5742b322f956 Uploaded
greg
parents:
diff changeset
94
5742b322f956 Uploaded
greg
parents:
diff changeset
95 <param name="numberOfSamples" type="integer" value="100000" min="1"
5742b322f956 Uploaded
greg
parents:
diff changeset
96 label="Number of samples"
5742b322f956 Uploaded
greg
parents:
diff changeset
97 help="Number of samples taken from the genome to compute the correlation"/>
5742b322f956 Uploaded
greg
parents:
diff changeset
98 <expand macro="bamCorrelate_mode_actions" />
5742b322f956 Uploaded
greg
parents:
diff changeset
99 </when>
5742b322f956 Uploaded
greg
parents:
diff changeset
100 <when value="BED-file">
5742b322f956 Uploaded
greg
parents:
diff changeset
101 <param name="region_file" type="data" format="bed" label="Region file in BED format" help="Correlation is computed for the number of reads that overlap such regions."/>
5742b322f956 Uploaded
greg
parents:
diff changeset
102 <expand macro="bamCorrelate_mode_actions" />
5742b322f956 Uploaded
greg
parents:
diff changeset
103 </when>
5742b322f956 Uploaded
greg
parents:
diff changeset
104
5742b322f956 Uploaded
greg
parents:
diff changeset
105 </conditional>
5742b322f956 Uploaded
greg
parents:
diff changeset
106
5742b322f956 Uploaded
greg
parents:
diff changeset
107 <conditional name="outputOpt">
5742b322f956 Uploaded
greg
parents:
diff changeset
108 <param name="showOutputOpt" type="select" label="Show additional output options" >
5742b322f956 Uploaded
greg
parents:
diff changeset
109 <option value="no" selected="true">no</option>
5742b322f956 Uploaded
greg
parents:
diff changeset
110 <option value="yes">yes</option>
5742b322f956 Uploaded
greg
parents:
diff changeset
111 </param>
5742b322f956 Uploaded
greg
parents:
diff changeset
112 <when value="no" />
5742b322f956 Uploaded
greg
parents:
diff changeset
113 <when value="yes">
5742b322f956 Uploaded
greg
parents:
diff changeset
114 <param name="saveRawCounts" type="boolean" label="Save the bin counts"/>
5742b322f956 Uploaded
greg
parents:
diff changeset
115 <param name="saveCorMatrix" type="boolean" label="Save the correlation matrix"/>
5742b322f956 Uploaded
greg
parents:
diff changeset
116 </when>
5742b322f956 Uploaded
greg
parents:
diff changeset
117 </conditional>
5742b322f956 Uploaded
greg
parents:
diff changeset
118
5742b322f956 Uploaded
greg
parents:
diff changeset
119 </inputs>
5742b322f956 Uploaded
greg
parents:
diff changeset
120 <outputs>
5742b322f956 Uploaded
greg
parents:
diff changeset
121 <data format="png" name="outFileName" />
5742b322f956 Uploaded
greg
parents:
diff changeset
122 <data format="tabular" name="outFileRawCounts" label="${tool.name} on ${on_string}: bin counts">
5742b322f956 Uploaded
greg
parents:
diff changeset
123 <filter>(outputOpt['showOutputOpt'] == 'yes' and outputOpt['saveRawCounts'] == True)</filter>
5742b322f956 Uploaded
greg
parents:
diff changeset
124 </data>
5742b322f956 Uploaded
greg
parents:
diff changeset
125 <data format="tabular" name="outFileCorMatrix" label="${tool.name} on ${on_string}: correlation matrix">
5742b322f956 Uploaded
greg
parents:
diff changeset
126 <filter>(outputOpt['showOutputOpt'] == 'yes' and outputOpt['saveCorMatrix'] == True)</filter>
5742b322f956 Uploaded
greg
parents:
diff changeset
127 </data>
5742b322f956 Uploaded
greg
parents:
diff changeset
128 </outputs>
5742b322f956 Uploaded
greg
parents:
diff changeset
129 <help>
5742b322f956 Uploaded
greg
parents:
diff changeset
130
5742b322f956 Uploaded
greg
parents:
diff changeset
131 **What it does**
5742b322f956 Uploaded
greg
parents:
diff changeset
132
5742b322f956 Uploaded
greg
parents:
diff changeset
133 This tool is useful to assess the overall similarity of different BAM files. A typical application
5742b322f956 Uploaded
greg
parents:
diff changeset
134 is to check the correlation between replicates or published data sets.
5742b322f956 Uploaded
greg
parents:
diff changeset
135
5742b322f956 Uploaded
greg
parents:
diff changeset
136 The tool splits the genomes into bins of given length. For each bin, the number of reads
5742b322f956 Uploaded
greg
parents:
diff changeset
137 found in each BAM file is counted and a correlation is computed for all
5742b322f956 Uploaded
greg
parents:
diff changeset
138 pairs of BAM files.
5742b322f956 Uploaded
greg
parents:
diff changeset
139
5742b322f956 Uploaded
greg
parents:
diff changeset
140
5742b322f956 Uploaded
greg
parents:
diff changeset
141 .. image:: $PATH_TO_IMAGES/QC_bamCorrelate_humanSamples.png
5742b322f956 Uploaded
greg
parents:
diff changeset
142 :alt: Heatmap of RNA Polymerase II ChIP-seq
5742b322f956 Uploaded
greg
parents:
diff changeset
143
5742b322f956 Uploaded
greg
parents:
diff changeset
144
5742b322f956 Uploaded
greg
parents:
diff changeset
145 **Output files**:
5742b322f956 Uploaded
greg
parents:
diff changeset
146
5742b322f956 Uploaded
greg
parents:
diff changeset
147 - diagnostic plot produced by bamCorrelate is a clustered heatmap displaying the values for each pair-wise correlation, see above for an example
5742b322f956 Uploaded
greg
parents:
diff changeset
148 - data matrix (optional) in case you want to plot the correlation values using a different program, e.g. R, this matrix can be used
5742b322f956 Uploaded
greg
parents:
diff changeset
149
5742b322f956 Uploaded
greg
parents:
diff changeset
150
5742b322f956 Uploaded
greg
parents:
diff changeset
151
5742b322f956 Uploaded
greg
parents:
diff changeset
152
5742b322f956 Uploaded
greg
parents:
diff changeset
153 -----
5742b322f956 Uploaded
greg
parents:
diff changeset
154
5742b322f956 Uploaded
greg
parents:
diff changeset
155 .. class:: infomark
5742b322f956 Uploaded
greg
parents:
diff changeset
156
5742b322f956 Uploaded
greg
parents:
diff changeset
157 @REFERENCES@
5742b322f956 Uploaded
greg
parents:
diff changeset
158
5742b322f956 Uploaded
greg
parents:
diff changeset
159 </help>
5742b322f956 Uploaded
greg
parents:
diff changeset
160 </tool>