annotate ideas_preprocessor.xml @ 21:99102499271a draft

Uploaded
author greg
date Wed, 31 Jan 2018 08:22:43 -0500
parents 237ee7319452
children 3651f1592f3f
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
16
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
1 <tool id="ideas_preprocessor" name="IDEAS Preprocessor" version="1.0.0">
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
2 <description></description>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
3 <requirements>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
4 <requirement type="package" version="2.5.4">deeptools</requirement>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
5 <requirement type="package" version="1.10.4">r-data.table</requirement>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
6 <requirement type="package" version="1.4.4">r-optparse</requirement>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
7 <requirement type="package" version="1.6">samtools</requirement>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
8 <requirement type="package" version="357">ucsc-bigwigaverageoverbed</requirement>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
9 </requirements>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
10 <command detect_errors="exit_code"><![CDATA[
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
11 #set chromosome_windows = "chromosome_windows.txt"
4
f577a83e86c4 Uploaded
greg
parents: 2
diff changeset
12 #set ideaspre_input_config = "ideaspre_input_config.txt"
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
13 #set specify_chrom_windows = $specify_chrom_windows_cond.specify_chrom_windows
2
248b5f72fc02 Uploaded
greg
parents: 0
diff changeset
14 mkdir -p '$output.files_path' &&
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
15 #if str($specify_chrom_windows) == "yes":
2
248b5f72fc02 Uploaded
greg
parents: 0
diff changeset
16 ##############################################
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
17 ## Using a bed file for defining chrom windows,
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
18 ## so categorize the window positions by
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
19 ## chromosome to enable the IDEAS -inv option.
2
248b5f72fc02 Uploaded
greg
parents: 0
diff changeset
20 ##############################################
4
f577a83e86c4 Uploaded
greg
parents: 2
diff changeset
21 cp '$gen_chromosome_windows' $chromosome_windows &&
2
248b5f72fc02 Uploaded
greg
parents: 0
diff changeset
22 #end if
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
23 ##############################################
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
24 ## Create the config file and prepare the data
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
25 ##############################################
4
f577a83e86c4 Uploaded
greg
parents: 2
diff changeset
26 cp '$gen_ideaspre_input_config' $ideaspre_input_config &&
f577a83e86c4 Uploaded
greg
parents: 2
diff changeset
27 sort $ideaspre_input_config -o $ideaspre_input_config &&
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
28 Rscript '$__tool_directory__/ideas_preprocessor.R'
4
f577a83e86c4 Uploaded
greg
parents: 2
diff changeset
29 --ideaspre_input_config '$ideaspre_input_config'
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
30 #if str($specify_chrom_windows) == "yes":
4
f577a83e86c4 Uploaded
greg
parents: 2
diff changeset
31 --chromosome_windows '$chromosome_windows'
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
32 --chrom_bed_input '$specify_chrom_windows_cond.chrom_bed_input'
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
33 #else:
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
34 --chrom_len_file '$chromInfo'
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
35 --window_size $specify_chrom_windows_cond.window_size
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
36 #set restrict_chromosomes = $specify_chrom_windows_cond.restrict_chromosomes_cond.restrict_chromosomes
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
37 #if str($restrict_chromosomes) == "yes":
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
38 #set chroms = []
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
39 #set chrom_repeat = $specify_chrom_windows_cond.restrict_chromosomes_cond.chrom_repeat
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
## Collect the text of each "chrom" field from the chrom_repeat instances and pass them as one comma-separated, quoted argument.
40 #for $i in $chrom_repeat
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
41 #silent $chroms.append(str($i.chrom))
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
42 #end for
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
43 --restrict_to_chroms '#echo ",".join($chroms)#'
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
44 #end if
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
45 #end if
13
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
46 #if str($bychr) == "true":
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
47 --bychr true
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
48 #end if
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
49 --reads_per_bp $reads_per_bp
13
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
50 #if str($exclude_bed_input) not in ["None", ""]:
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
51 --exclude_bed_input '$exclude_bed_input'
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
52 #end if
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
53 #if str($standardize_datasets) == "true":
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
54 --standardize_datasets true
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
55 #end if
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
56 --output '$output'
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
57 --output_files_path '$output.files_path'
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
58 &> ideas_preprocessor_log.txt;
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
59 if [[ $? -ne 0 ]]; then
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
60 cp ideas_preprocessor_log.txt '$output';
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
61 exit 1;
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
62 fi
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
63 ]]></command>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
64 <configfiles>
4
f577a83e86c4 Uploaded
greg
parents: 2
diff changeset
65 <configfile name="gen_ideaspre_input_config"><![CDATA[#if str($cell_type_epigenetic_factor_cond.cell_type_epigenetic_factor) == "extract":
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
66 #set input_name_positions = $cell_type_epigenetic_factor_cond.input_name_positions
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
67 #for $i in $cell_type_epigenetic_factor_cond.input:
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
68 #set file_name_with_ext = $i.name
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
69 #if str($file_name_with_ext).find("http") >= 0 or str($file_name_with_ext).find("ftp") >= 0:
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
70 #set file_name_with_ext = $file_name_with_ext.split('/')[-1]
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
71 #end if
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
72 #assert str($file_name_with_ext).find("-") >= 0, "The selected input '%s' is invalid because it does not include the '-' character which is required when setting cell type and epigenetic factor names by extracting them from the input file names." % $file_name_with_ext
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
73 #set file_name = $file_name_with_ext.split(".")[0]
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
74 #if str($input_name_positions) == "cell_first":
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
75 #set cell_type_name = $file_name.split("-")[0]
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
76 #set epigenetic_factor_name = $file_name.split("-")[1]
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
77 #else:
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
78 #set cell_type_name = $file_name.split("-")[1]
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
79 #set epigenetic_factor_name = $file_name.split("-")[0]
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
80 #end if
2
248b5f72fc02 Uploaded
greg
parents: 0
diff changeset
81 ${cell_type_name} ${epigenetic_factor_name} ${i} ${file_name} ${i.ext}
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
82 #end for
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
83 #else:
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
84 #for $input_items in $cell_type_epigenetic_factor_cond.input_repeat:
2
248b5f72fc02 Uploaded
greg
parents: 0
diff changeset
85 ${input_items.cell_type_name} ${input_items.epigenetic_factor_name} ${input_items.input} #echo str($input_items.input.name).split('/')[-1].split(".")[0]# ${input_items.input.ext}
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
86 #end for
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
87 #end if]]></configfile>
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
88 <configfile name="gen_chromosome_windows"><![CDATA[#if str($specify_chrom_windows_cond.specify_chrom_windows) == "yes":
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
89 #import collections
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
90 #set window_positions_by_chroms_odict = $collections.OrderedDict()
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
91 #for count, line in enumerate(open($specify_chrom_windows_cond.chrom_bed_input.file_name, 'r')):
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
92 #set $line = $line.strip()
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
93 #if not $line or $line.startswith('#'):
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
94 #continue
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
95 #end if
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
96 #set items = $line.split('\t')
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
97 #if $items[0] in $window_positions_by_chroms_odict:
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
98 #set tup = $window_positions_by_chroms_odict[$items[0]]
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
99 #set $tup[1] += 1
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
100 #set $window_positions_by_chroms_odict[$items[0]] = $tup
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
101 #else:
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
102 #set $window_positions_by_chroms_odict[$items[0]] = [$count, $count+1]
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
103 #end if
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
104 #end for
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
105 #for $chrom, $tup in $window_positions_by_chroms_odict.items():
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
106 ${chrom} ${tup[0]} ${tup[1]}
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
107 #end for
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
108 #end if]]></configfile>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
109 </configfiles>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
110 <inputs>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
111 <conditional name="cell_type_epigenetic_factor_cond">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
112 <param name="cell_type_epigenetic_factor" type="select" label="Set cell type and epigenetic factor names by">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
113 <option value="extract" selected="true">extracting them from the selected input file names</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
114 <option value="manual">manually setting them for each selected input</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
115 </param>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
116 <when value="extract">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
117 <param name="input" type="data" format="bigwig,bam" multiple="True" label="BAM or BigWig files">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
118 <validator type="empty_field"/>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
119 <validator type="unspecified_build"/>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
120 </param>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
121 <param name="input_name_positions" type="select" display="radio" label="Selected input file name pattern is" help="A '-' character must separate cell type and epigenetic factor names within the selected input file names">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
122 <option value="cell_first" selected="true">Cell type name - Epigenetic factor name</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
123 <option value="cell_last">Epigenetic factor name - Cell type name</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
124 </param>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
125 </when>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
126 <when value="manual">
16
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
127 <repeat name="input_repeat" title="Cell type, epigenetic factor and input" min="1">
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
128 <param name="cell_type_name" type="text" value="" label="Cell type name">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
129 <validator type="empty_field"/>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
130 </param>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
131 <param name="epigenetic_factor_name" type="text" value="" label="Epigenetic factor name">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
132 <validator type="empty_field"/>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
133 </param>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
134 <param name="input" type="data" format="bigwig,bam" label="BAM or BigWig file">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
135 <validator type="empty_field"/>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
136 <validator type="unspecified_build"/>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
137 </param>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
138 </repeat>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
139 </when>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
140 </conditional>
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
141 <conditional name="specify_chrom_windows_cond">
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
142 <param name="specify_chrom_windows" type="select" label="Define chromosome window positions from a bed file?">
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
143 <option value="no" selected="true">No</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
144 <option value="yes">Yes</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
145 </param>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
146 <when value="no">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
147 <param name="window_size" type="integer" value="200" label="Window size in base pairs"/>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
148 <conditional name="restrict_chromosomes_cond">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
149 <param name="restrict_chromosomes" type="select" label="Restrict processing to specified chromosomes">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
150 <option value="no" selected="true">No</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
151 <option value="yes">Yes</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
152 </param>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
153 <when value="no"/>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
154 <when value="yes">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
155 <repeat name="chrom_repeat" title="Chromosomes" min="1">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
156 <param name="chrom" type="text" value="" label="Chromosome" help="One chromosome (e.g., chr1, chr2, chrX) per text field"/>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
157 </repeat>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
158 </when>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
159 </conditional>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
160 </when>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
161 <when value="yes">
13
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
162 <param name="chrom_bed_input" type="data" format="bed" label="Select bed file for defining chromosome window positions">
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
163 <validator type="empty_dataset"/>
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
164 </param>
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
165 </when>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
166 </conditional>
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
167 <param name="bychr" type="boolean" truevalue="true" falsevalue="" checked="False" label="Output chromosomes in separate files"/>
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
168 <param name="reads_per_bp" type="select" display="radio" label="Calculate the signal in each window using">
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
169 <option value="6" selected="true">mean</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
170 <option value="8">max</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
171 </param>
13
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
172 <param name="exclude_bed_input" type="data" format="bed" optional="True" multiple="True" label="Select bed file(s) containing regions to exclude"/>
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
173 <param name="standardize_datasets" type="boolean" truevalue="true" falsevalue="" checked="False" label="Standardize all datasets"/>
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
174 </inputs>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
175 <outputs>
4
f577a83e86c4 Uploaded
greg
parents: 2
diff changeset
176 <data name="output" format="ideaspre"/>
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
177 </outputs>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
178 <tests>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
179 <test>
16
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
180 <param name="input" value="e001-h3k4me3.bigwig" ftype="bigwig" dbkey="hg19"/>
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
181 <param name="specify_chrom_windows" value="yes"/>
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
182 <param name="chrom_bed_input" value="chrom_windows.bed" ftype="bed" dbkey="hg19"/>
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
183 <output name="output" file="output.ideaspre" ftype="ideaspre" />
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
184 </test>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
185 </tests>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
186 <help>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
187 **What it does**
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
188
16
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
189 Takes as input a list of epigenetic data sets (histones, chromatin accessibility, CpG methylation, TFs, etc.)
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
190 or any other whole-genome data sets (e.g., scores). Currently the supported data formats are BigWig and BAM.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
191 All data sets are mapped to a common genomic coordinate in a selected assembly (user-provided window size
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
192 or 200bp windows by default). The user can specify regions to be considered or removed from the analysis.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
193 The input data may come from one cell type/condition/individual/time point (although this approach does not
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
194 fully utilize the advantages of IDEAS), or from multiple cell types/conditions/individuals/time points. The
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
195 same set of epigenetic features may not be present in all cell types, in which case IDEAS performs imputation
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
196 of the missing tracks if specified. This tool produces a single dataset with the **IdeasPre** datatype for
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
197 use as input to the IDEAS tool.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
198
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
199 -----
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
200
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
201 **Required options**
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
202
16
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
203 * **Set cell type and epigenetic factor names by** - cell type and epigenetic factor names can be set manually or by extracting them from the names of the selected input datasets. The latter case requires all selected datasets to have names that contain a "-" character.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
204
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
205 * **BAM or BigWig files** - select one or more Bam or Bigwig files from your history, making sure that the name of every selected input includes a "-" character (e.g., e001-h3k4me3.bigwig).
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
206 * **Cell type, Epigenetic factor and Input** - manually select any number of inputs, setting the cell type and epigenetic factor name for each. The combination of "cell type name" and "epigenetic factor name" must be unique for each input. For example, if you have replicate data you may want to specify the cell name as "rep1", "rep2", etc and the factor name as "rep1", "rep2", etc.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
207
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
208 * **Cell type name** - cell type name if specifying manually.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
209 * **Epigenetic factor name** - epigenetic factor name if specifying manually.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
210 * **BAM or BigWig file** - BAM or BigWig file.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
211 * **Selected input file name pattern is** - select the file name pattern, either **epigenetic factor name-cell type name** or **cell type name-epigenetic factor name**.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
212
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
213 * **Define chromosome window positions from a bed file** - select "No" to run whole genome segmentation or select "Yes" to segment genomes within the unit of the windows defined by the bed file. This file can be in BED3, BED4 or BED5 format, but only the first three columns (chr posst posed) will be used.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
214
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
215 * **Window size in base pairs** - Window size in base pairs if specifying manually.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
216 * **Restrict processing to specified chromosomes** - select "Yes" to restrict processing to specified chromosomes.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
217
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
218 * **Chromosomes** - enter one chromosome (e.g., chr1, chr2, chrX) per text field, adding a field for each chromosome to be processed.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
219
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
220 * **Select bed file for defining chromosome window positions** - select a bed file for specifying the chromosome window positions.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
221
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
222 * **Output chromosomes in separate files** - select "Yes" to produce separate files for each chromosome, allowing you to run IDEAS on different chromosomes separately.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
223 * **Calculate the signal in each window using** - use the bigWigAverageOverBed utility from the UCSC genome browser to calculate the signal (i.e., the number of reads per bp) in each window.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
224 * **Select bed file(s) containing regions to exclude** - select one or more bed files that contain regions you'd like excluded from your datasets.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
225 * **Standardize all datasets** - select "Yes" to standardize all datasets (e.g., reads / total_reads * 20 million) so that the signals from different cell types become comparable - your datasets can be read counts, logp-values or fold change.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
226
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
227 </help>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
228 <citations>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
229 <citation type="doi">10.1093/nar/gkw278</citation>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
230 </citations>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
231 </tool>