annotate ideas_preprocessor.xml @ 22:3651f1592f3f draft

Uploaded
author greg
date Wed, 31 Jan 2018 14:13:11 -0500
parents 237ee7319452
children 71345e154c66
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
16
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
1 <tool id="ideas_preprocessor" name="IDEAS Preprocessor" version="1.0.0">
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
2 <description></description>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
3 <requirements>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
4 <requirement type="package" version="2.5.4">deeptools</requirement>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
5 <requirement type="package" version="1.10.4">r-data.table</requirement>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
6 <requirement type="package" version="1.4.4">r-optparse</requirement>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
7 <requirement type="package" version="1.6">samtools</requirement>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
8 <requirement type="package" version="357">ucsc-bigwigaverageoverbed</requirement>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
9 </requirements>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
10 <command detect_errors="exit_code"><![CDATA[
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
11 #set chromosome_windows = "chromosome_windows.txt"
4
f577a83e86c4 Uploaded
greg
parents: 2
diff changeset
12 #set ideaspre_input_config = "ideaspre_input_config.txt"
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
13 #set specify_chrom_windows = $specify_chrom_windows_cond.specify_chrom_windows
22
3651f1592f3f Uploaded
greg
parents: 20
diff changeset
14 #set tmp_dir = "tmp"
3651f1592f3f Uploaded
greg
parents: 20
diff changeset
15 mkdir $tmp_dir &&
2
248b5f72fc02 Uploaded
greg
parents: 0
diff changeset
16 mkdir $output.files_path &&
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
17 #if str($specify_chrom_windows) == "yes":
2
248b5f72fc02 Uploaded
greg
parents: 0
diff changeset
18 ##############################################
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
19 ## Using a bed file for defining chrom windows,
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
20 ## so categorize the window positions by
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
21 ## chromosome to enable the IDEAS -inv option.
2
248b5f72fc02 Uploaded
greg
parents: 0
diff changeset
22 ##############################################
4
f577a83e86c4 Uploaded
greg
parents: 2
diff changeset
23 cp '$gen_chromosome_windows' $chromosome_windows &&
2
248b5f72fc02 Uploaded
greg
parents: 0
diff changeset
24 #end if
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
25 ##############################################
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
26 ## Create the config file and prepare the data
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
27 ##############################################
4
f577a83e86c4 Uploaded
greg
parents: 2
diff changeset
28 cp '$gen_ideaspre_input_config' $ideaspre_input_config &&
f577a83e86c4 Uploaded
greg
parents: 2
diff changeset
29 sort $ideaspre_input_config -o $ideaspre_input_config &&
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
30 Rscript '$__tool_directory__/ideas_preprocessor.R'
4
f577a83e86c4 Uploaded
greg
parents: 2
diff changeset
31 --ideaspre_input_config '$ideaspre_input_config'
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
32 #if str($specify_chrom_windows) == "yes":
4
f577a83e86c4 Uploaded
greg
parents: 2
diff changeset
33 --chromosome_windows '$chromosome_windows'
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
34 --chrom_bed_input '$specify_chrom_windows_cond.chrom_bed_input'
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
35 #else:
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
36 --chrom_len_file '$chromInfo'
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
37 --window_size $specify_chrom_windows_cond.window_size
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
38 #set restrict_chromosomes = $specify_chrom_windows_cond.restrict_chromosomes_cond.restrict_chromosomes
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
39 #if str($restrict_chromosomes) == "yes":
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
40 #set chroms = []
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
41 #for $i in $specify_chrom_windows_cond.restrict_chromosomes_cond.chrom_repeat
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
42 #silent $chroms.append(str($i.chrom))
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
43 #end for
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
44 #set chroms_csv = ",".join($chroms)
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
45 --restrict_to_chroms '$chroms_csv'
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
46 #end if
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
47 #end if
13
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
48 #if str($bychr) == "true":
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
49 --bychr true
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
50 #end if
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
51 --reads_per_bp $reads_per_bp
13
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
52 #if str($exclude_bed_input) not in ["None", ""]:
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
53 --exclude_bed_input '$exclude_bed_input'
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
54 #end if
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
55 #if str($standardize_datasets) == "true":
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
56 --standardize_datasets true
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
57 #end if
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
58 --output '$output'
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
59 --output_files_path '$output.files_path'
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
60 &> ideas_preprocessor_log.txt;
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
61 if [[ $? -ne 0 ]]; then
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
62 cp ideas_preprocessor_log.txt '$output';
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
63 exit 1;
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
64 fi
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
65 ]]></command>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
66 <configfiles>
4
f577a83e86c4 Uploaded
greg
parents: 2
diff changeset
67 <configfile name="gen_ideaspre_input_config"><![CDATA[#if str($cell_type_epigenetic_factor_cond.cell_type_epigenetic_factor) == "extract":
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
68 #set input_name_positions = $cell_type_epigenetic_factor_cond.input_name_positions
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
69 #for $i in $cell_type_epigenetic_factor_cond.input:
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
70 #set file_name_with_ext = $i.name
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
71 #if str($file_name_with_ext).find("http") >= 0 or str($file_name_with_ext).find("ftp") >= 0:
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
72 #set file_name_with_ext = $file_name_with_ext.split('/')[-1]
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
73 #end if
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
74 #assert str($file_name_with_ext).find("-") >= 0, "The selected input '%s' is invalid because it does not include the '-' character which is required when setting cell type and epigenetic factor names by extracting them from the input file names." % $file_name_with_ext
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
75 #set file_name = $file_name_with_ext.split(".")[0]
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
76 #if str($input_name_positions) == "cell_first":
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
77 #set cell_type_name = $file_name.split("-")[0]
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
78 #set epigenetic_factor_name = $file_name.split("-")[1]
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
79 #else:
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
80 #set cell_type_name = $file_name.split("-")[1]
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
81 #set epigenetic_factor_name = $file_name.split("-")[0]
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
82 #end if
2
248b5f72fc02 Uploaded
greg
parents: 0
diff changeset
83 ${cell_type_name} ${epigenetic_factor_name} ${i} ${file_name} ${i.ext}
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
84 #end for
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
85 #else:
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
86 #for $input_items in $cell_type_epigenetic_factor_cond.input_repeat:
2
248b5f72fc02 Uploaded
greg
parents: 0
diff changeset
87 ${input_items.cell_type_name} ${input_items.epigenetic_factor_name} ${input_items.input} ${input_items.input.name.split("/")[-1].split(".")[0]} ${input_items.input.ext}
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
88 #end for
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
89 #end if]]></configfile>
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
90 <configfile name="gen_chromosome_windows"><![CDATA[#if str($specify_chrom_windows_cond.specify_chrom_windows) == "yes":
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
91 #import collections
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
92 #set window_positions_by_chroms_odict = $collections.OrderedDict()
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
93 #for count, line in enumerate(open($specify_chrom_windows_cond.chrom_bed_input.file_name, 'r')):
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
94 #set $line = $line.strip()
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
95 #if not $line or $line.startswith('#'):
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
96 #continue
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
97 #end if
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
98 #set items = $line.split('\t')
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
99 #if $items[0] in $window_positions_by_chroms_odict:
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
100 #set tup = $window_positions_by_chroms_odict[$items[0]]
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
101 #set $tup[1] += 1
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
102 #set $window_positions_by_chroms_odict[$items[0]] = $tup
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
103 #else:
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
104 #set $window_positions_by_chroms_odict[$items[0]] = [$count, $count+1]
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
105 #end if
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
106 #end for
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
107 #for $chrom, $tup in $window_positions_by_chroms_odict.items():
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
108 ${chrom} ${tup[0]} ${tup[1]}
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
109 #end for
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
110 #end if]]></configfile>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
111 </configfiles>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
112 <inputs>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
113 <conditional name="cell_type_epigenetic_factor_cond">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
114 <param name="cell_type_epigenetic_factor" type="select" label="Set cell type and epigenetic factor names by">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
115 <option value="extract" selected="true">extracting them from the selected input file names</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
116 <option value="manual">manually setting them for each selected input</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
117 </param>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
118 <when value="extract">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
119 <param name="input" type="data" format="bigwig,bam" multiple="True" label="BAM or BigWig files">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
120 <validator type="empty_field"/>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
121 <validator type="unspecified_build"/>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
122 </param>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
123 <param name="input_name_positions" type="select" display="radio" label="Selected input file name pattern is" help="A '-' character must separate cell type and epigenetic factor names within the selected input file names">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
124 <option value="cell_first" selected="true">Cell type name - Epigenetic factor name</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
125 <option value="cell_last">Epigenetic factor name - Cell type name</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
126 </param>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
127 </when>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
128 <when value="manual">
16
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
129 <repeat name="input_repeat" title="Cell type, epigenetic factor and input" min="1">
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
130 <param name="cell_type_name" type="text" value="" label="Cell type name">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
131 <validator type="empty_field"/>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
132 </param>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
133 <param name="epigenetic_factor_name" type="text" value="" label="Epigenetic factor name">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
134 <validator type="empty_field"/>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
135 </param>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
136 <param name="input" type="data" format="bigwig,bam" label="BAM or BigWig file">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
137 <validator type="empty_field"/>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
138 <validator type="unspecified_build"/>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
139 </param>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
140 </repeat>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
141 </when>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
142 </conditional>
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
143 <conditional name="specify_chrom_windows_cond">
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
144 <param name="specify_chrom_windows" type="select" label="Define chromosome window positions from a bed file?">
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
145 <option value="no" selected="true">No</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
146 <option value="yes">Yes</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
147 </param>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
148 <when value="no">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
149 <param name="window_size" type="integer" value="200" label="Window size in base pairs"/>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
150 <conditional name="restrict_chromosomes_cond">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
151 <param name="restrict_chromosomes" type="select" label="Restrict processing to specified chromosomes">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
152 <option value="no" selected="true">No</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
153 <option value="yes">Yes</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
154 </param>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
155 <when value="no"/>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
156 <when value="yes">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
157 <repeat name="chrom_repeat" title="Chromosomes" min="1">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
158 <param name="chrom" type="text" value="" label="Chromosome" help="One chromosome (e.g., chr1, chr2, chrX) per text field"/>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
159 </repeat>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
160 </when>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
161 </conditional>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
162 </when>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
163 <when value="yes">
13
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
164 <param name="chrom_bed_input" type="data" format="bed" label="Select bed file for defining chromosome window positions">
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
165 <validator type="empty_dataset"/>
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
166 </param>
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
167 </when>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
168 </conditional>
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
169 <param name="bychr" type="boolean" truevalue="true" falsevalue="" checked="False" label="Output chromosomes in separate files"/>
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
170 <param name="reads_per_bp" type="select" display="radio" label="Calculate the signal in each window using">
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
171 <option value="6" selected="true">mean</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
172 <option value="8">max</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
173 </param>
13
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
174 <param name="exclude_bed_input" type="data" format="bed" optional="True" multiple="True" label="Select bed file(s) containing regions to exclude"/>
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
175 <param name="standardize_datasets" type="boolean" truevalue="true" falsevalue="" checked="False" label="Standardize all datasets"/>
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
176 </inputs>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
177 <outputs>
4
f577a83e86c4 Uploaded
greg
parents: 2
diff changeset
178 <data name="output" format="ideaspre"/>
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
179 </outputs>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
180 <tests>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
181 <test>
16
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
182 <param name="input" value="e001-h3k4me3.bigwig" ftype="bigwig" dbkey="hg19"/>
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
183 <param name="specify_chrom_windows" value="yes"/>
22
3651f1592f3f Uploaded
greg
parents: 20
diff changeset
184 <param name="chrom_bed_input" value="chromosomes.bed" ftype="bed" dbkey="hg19"/>
3651f1592f3f Uploaded
greg
parents: 20
diff changeset
185 <output name="output" file="output.html" ftype="ideaspre">
3651f1592f3f Uploaded
greg
parents: 20
diff changeset
186 <extra_files type="file" name="chromosomes.bed" value="chromosomes.bed"/>
3651f1592f3f Uploaded
greg
parents: 20
diff changeset
187 <extra_files type="file" name="chromosome_windows.txt" value="chromosome_windows.txt"/>
3651f1592f3f Uploaded
greg
parents: 20
diff changeset
188 <extra_files type="file" name="IDEAS_input_config.txt" value="IDEAS_input_config.txt"/>
3651f1592f3f Uploaded
greg
parents: 20
diff changeset
189 <extra_files type="file" name="tmp.tar" value="tmp.tar" compare="sim_size"/>
3651f1592f3f Uploaded
greg
parents: 20
diff changeset
190 </output>
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
191 </test>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
192 </tests>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
193 <help>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
194 **What it does**
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
195
16
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
196 Takes as input a list of epigenetic data sets (histones, chromatin accessibility, CpG methylation, TFs, etc.)
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
197 or any other whole-genome data sets (e.g., scores). Currently the supported data formats are BigWig and BAM.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
198 All data sets are mapped to a common genomic coordinate in a selected assembly (user-provided window size
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
199 or 200bp windows by default). The user can specify regions to be considered or removed from the analysis.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
200 The input data may come from one cell type/condition/individual/time point (although this approach does not
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
201 fully utilize the advantages of IDEAS), or from multiple cell types/conditions/individuals/time points. The
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
202 same set of epigenetic features may not be present in all cell types, in which case IDEAS performs imputation
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
203 of the missing tracks if specified. This tool produces a single dataset with the **IdeasPre** datatype for
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
204 use as input to the IDEAS tool.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
205
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
206 -----
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
207
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
208 **Required options**
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
209
16
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
210 * **Set cell type and epigenetic factor names by** - cell type and epigenetic factor names can be set manually or by extracting them from the names of the selected input datasets. The latter case requires all selected datasets to have names that contain a "-" character.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
211
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
212 * **BAM or BigWig files** - select one or more BAM or BigWig files from your history, making sure that the name of every selected input includes a "-" character (e.g., e001-h3k4me3.bigwig).
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
213 * **Cell type, Epigenetic factor and Input** - manually select any number of inputs, setting the cell type and epigenetic factor name for each. The combination of "cell type name" and "epigenetic factor name" must be unique for each input. For example, if you have replicate data you may want to specify the cell name as "rep1", "rep2", etc and the factor name as "rep1", "rep2", etc.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
214
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
215 * **Cell type name** - cell type name if specifying manually.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
216 * **Epigenetic factor name** - epigenetic factor name if specifying manually.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
217 * **BAM or BigWig file** - BAM or BigWig file.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
218 * **Selected input file name pattern is** - select the file name pattern, either **epigenetic factor name-cell type name** or **cell type name-epigenetic factor name**.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
219
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
220 * **Define chromosome window positions from a bed file** - select "No" to run whole genome segmentation or select "Yes" to segment genomes within the unit of the windows defined by the bed file. This file can be in BED3, BED4 or BED5 format, but only the first three columns (chr posst posed) will be used.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
221
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
222 * **Window size in base pairs** - Window size in base pairs if specifying manually.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
223 * **Restrict processing to specified chromosomes** - select "Yes" to restrict processing to specified chromosomes.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
224
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
225 * **Chromosomes** - enter the chromosomes for processing, one chromosome (e.g., chr1, chr2, chrX) per text field.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
226
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
227 * **Select bed file for defining chromosome window positions** - select a bed file for specifying the chromosome window positions.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
228
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
229 * **Output chromosomes in separate files** - select "Yes" to produce separate files for each chromosome, allowing you to run IDEAS on different chromosomes separately.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
230 * **Calculate the signal in each window using** - use the bigWigAverageOverBed utility from the UCSC genome browser to calculate the signal (i.e., the number of reads per bp) in each window.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
231 * **Select bed file(s) containing regions to exclude** - select one or more bed files that contain regions you'd like excluded from your datasets.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
232 * **Standardize all datasets** - select "Yes" to standardize all datasets (e.g., reads / total_reads * 20 million) so that the signals from different cell types become comparable - your datasets can be read counts, logp-values or fold change.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
233
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
234 </help>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
235 <citations>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
236 <citation type="doi">10.1093/nar/gkw278</citation>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
237 </citations>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
238 </tool>