annotate realigner_target_creator.xml @ 9:fc0e2a67ace8 draft

Uploaded
author iuc
date Tue, 07 Apr 2015 22:46:05 -0400
parents b80301676614
children 0d369d08ad6e
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
6
b80301676614 Uploaded
iuc
parents: 2
diff changeset
1 <tool id="gatk2_realigner_target_creator" name="Realigner Target Creator" version="@VERSION@.1">
0
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
2 <description>for use in local realignment</description>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
3 <expand macro="requirements" />
6
b80301676614 Uploaded
iuc
parents: 2
diff changeset
4 <expand macro="version_command" />
0
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
5 <macros>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
6 <import>gatk2_macros.xml</import>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
7 </macros>
1
c8752e31f496 Uploaded
bgruening
parents: 0
diff changeset
8 <command interpreter="python">
c8752e31f496 Uploaded
bgruening
parents: 0
diff changeset
9 gatk2_wrapper.py
c8752e31f496 Uploaded
bgruening
parents: 0
diff changeset
10 --stdout "${output_log}"
c8752e31f496 Uploaded
bgruening
parents: 0
diff changeset
11 -d "-I" "${reference_source.input_bam}" "${reference_source.input_bam.ext}" "gatk_input"
c8752e31f496 Uploaded
bgruening
parents: 0
diff changeset
12 #if str( $reference_source.input_bam.metadata.bam_index ) != "None":
c8752e31f496 Uploaded
bgruening
parents: 0
diff changeset
13 -d "" "${reference_source.input_bam.metadata.bam_index}" "bam_index" "gatk_input" ##hardcode galaxy ext type as bam_index
c8752e31f496 Uploaded
bgruening
parents: 0
diff changeset
14 #end if
c8752e31f496 Uploaded
bgruening
parents: 0
diff changeset
15 -p '
c8752e31f496 Uploaded
bgruening
parents: 0
diff changeset
16 @JAR_PATH@
0
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
17 -T "RealignerTargetCreator"
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
18 -o "${output_interval}"
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
19
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
20 \$GATK2_SITE_OPTIONS
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
21
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
22 ## force a single CPU thread per data thread for this walker, according to http://www.broadinstitute.org/gatk/guide/article?id=1975
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
23 --num_cpu_threads_per_data_thread 1
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
24
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
25 @THREADS@
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
26
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
27 #if $reference_source.reference_source_selector != "history":
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
28 -R "${reference_source.ref_file.fields.path}"
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
29 #end if
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
30 '
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
31 #set $rod_binding_names = dict()
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
32 #for $rod_binding in $rod_bind:
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
33 #if str( $rod_binding.rod_bind_type.rod_bind_type_selector ) == 'custom':
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
34 #set $rod_bind_name = $rod_binding.rod_bind_type.custom_rod_name
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
35 #else
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
36 #set $rod_bind_name = $rod_binding.rod_bind_type.rod_bind_type_selector
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
37 #end if
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
38 #set $rod_binding_names[$rod_bind_name] = $rod_binding_names.get( $rod_bind_name, -1 ) + 1
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
39 -d "-known:${rod_bind_name},%(file_type)s" "${rod_binding.rod_bind_type.input_rod}" "${rod_binding.rod_bind_type.input_rod.ext}" "input_${rod_bind_name}_${rod_binding_names[$rod_bind_name]}"
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
40 #end for
6
b80301676614 Uploaded
iuc
parents: 2
diff changeset
41
b80301676614 Uploaded
iuc
parents: 2
diff changeset
42 $allow_n_cigar_reads
0
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
43 #include source=$standard_gatk_options#
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
44 ##start analysis specific options
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
45 #if $analysis_param_type.analysis_param_type_selector == "advanced":
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
46 -p '
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
47 --minReadsAtLocus "${analysis_param_type.minReadsAtLocus}"
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
48 --windowSize "${analysis_param_type.windowSize}"
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
49 --mismatchFraction "${analysis_param_type.mismatchFraction}"
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
50 --maxIntervalSize "${analysis_param_type.maxIntervalSize}"
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
51 '
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
52 #end if
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
53 </command>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
54 <inputs>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
55 <conditional name="reference_source">
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
56 <expand macro="reference_source_selector_param" />
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
57 <when value="cached">
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
58 <param name="input_bam" type="data" format="bam" label="BAM file" help="-I,--input_file &amp;lt;input_file&amp;gt;">
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
59 <validator type="unspecified_build" />
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
60 <validator type="dataset_metadata_in_data_table" table_name="gatk2_picard_indexes" metadata_name="dbkey" metadata_column="dbkey" message="Sequences are not currently available for the specified build." /> <!-- fixme!!! this needs to be a select -->
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
61 </param>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
62 <param name="ref_file" type="select" label="Using reference genome" help="-R,--reference_sequence &amp;lt;reference_sequence&amp;gt;" >
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
63 <options from_data_table="gatk2_picard_indexes">
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
64 <filter type="data_meta" key="dbkey" ref="input_bam" column="dbkey"/>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
65 </options>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
66 <validator type="no_options" message="A built-in reference genome is not available for the build associated with the selected input file"/>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
67 </param>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
68 </when>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
69 <when value="history">
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
70 <param name="input_bam" type="data" format="bam" label="BAM file" help="-I,--input_file &amp;lt;input_file&amp;gt;" />
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
71 <param name="ref_file" type="data" format="fasta" label="Using reference file" help="-R,--reference_sequence &amp;lt;reference_sequence&amp;gt;">
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
72 <options>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
73 <filter type="data_meta" key="dbkey" ref="input_bam" />
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
74 </options>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
75 </param>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
76 </when>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
77 </conditional>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
78
2
28b85e2409ce Uploaded
bgruening
parents: 1
diff changeset
79 <repeat name="rod_bind" title="Known Variants" help="Using data sets of known variants (-known,--known &amp;lt;known&amp;gt;)">
0
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
80 <conditional name="rod_bind_type">
2
28b85e2409ce Uploaded
bgruening
parents: 1
diff changeset
81 <param name="rod_bind_type_selector" type="select" label="Variant Type">
0
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
82 <option value="dbsnp" selected="True">dbSNP</option>
2
28b85e2409ce Uploaded
bgruening
parents: 1
diff changeset
83 <option value="snps">SNPs</option>
0
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
84 <option value="indels">INDELs</option>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
85 <option value="custom">Custom</option>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
86 </param>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
87 <when value="dbsnp">
2
28b85e2409ce Uploaded
bgruening
parents: 1
diff changeset
88 <param name="input_rod" type="data" format="vcf" label="Variant file (VCF format)" />
0
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
89 </when>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
90 <when value="snps">
2
28b85e2409ce Uploaded
bgruening
parents: 1
diff changeset
91 <param name="input_rod" type="data" format="vcf" label="Variant file (VCF format)" />
0
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
92 </when>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
93 <when value="indels">
2
28b85e2409ce Uploaded
bgruening
parents: 1
diff changeset
94 <param name="input_rod" type="data" format="vcf" label="Variant file (VCF format)" />
0
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
95 </when>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
96 <when value="custom">
2
28b85e2409ce Uploaded
bgruening
parents: 1
diff changeset
97 <param name="custom_rod_name" type="text" value="Unknown" label="Custom variant name" help="Name under which the variant file below is bound (-known:NAME,type); this is a name, not a file" /> <!-- value is used as rod_bind_name in the command template -->
28b85e2409ce Uploaded
bgruening
parents: 1
diff changeset
98 <param name="input_rod" type="data" format="vcf" label="Variant file (VCF format)" />
0
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
99 </when>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
100 </conditional>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
101 </repeat>
6
b80301676614 Uploaded
iuc
parents: 2
diff changeset
102
b80301676614 Uploaded
iuc
parents: 2
diff changeset
103 <expand macro="allow_n_cigar_reads" />
0
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
104 <expand macro="gatk_param_type_conditional" />
6
b80301676614 Uploaded
iuc
parents: 2
diff changeset
105
0
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
106 <expand macro="analysis_type_conditional">
6
b80301676614 Uploaded
iuc
parents: 2
diff changeset
107 <param name="windowSize" type="integer" value="10" label="Window size for calculating entropy or SNP clusters (windowSize)"
b80301676614 Uploaded
iuc
parents: 2
diff changeset
108 help="-window,--windowSize &amp;lt;windowSize&amp;gt;" />
b80301676614 Uploaded
iuc
parents: 2
diff changeset
109 <param name="mismatchFraction" type="float" value="0.15" label="Fraction of base qualities needing to mismatch for a position to have high entropy (mismatchFraction)"
b80301676614 Uploaded
iuc
parents: 2
diff changeset
110 help="to disable set to &lt;= 0 or &gt; 1 (-mismatch,--mismatchFraction &amp;lt;mismatchFraction&amp;gt;)"/>
b80301676614 Uploaded
iuc
parents: 2
diff changeset
111 <param name="minReadsAtLocus" type="integer" value="4" label="Minimum reads at a locus to enable using the entropy calculation (minReadsAtLocus)"
b80301676614 Uploaded
iuc
parents: 2
diff changeset
112 help="-minReads,--minReadsAtLocus &amp;lt;minReadsAtLocus&amp;gt;" />
0
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
113 <param name="maxIntervalSize" type="integer" value="500" label="Maximum interval size" help="-maxInterval,--maxIntervalSize &amp;lt;maxIntervalSize&amp;gt;" />
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
114 </expand>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
115 </inputs>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
116 <outputs>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
117 <data format="gatk_interval" name="output_interval" label="${tool.name} on ${on_string} (GATK intervals)" />
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
118 <data format="txt" name="output_log" label="${tool.name} on ${on_string} (log)" />
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
119 </outputs>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
120 <tests>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
121 <test>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
122 <param name="reference_source_selector" value="history" />
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
123 <param name="ref_file" value="phiX.fasta" ftype="fasta" />
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
124 <param name="input_bam" value="gatk/fake_phiX_reads_1.bam" ftype="bam" />
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
125 <param name="rod_bind_type_selector" value="dbsnp" />
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
126 <param name="input_rod" value="gatk/fake_phiX_variant_locations.vcf" ftype="vcf" />
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
127 <param name="gatk_param_type_selector" value="basic" />
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
128 <param name="analysis_param_type_selector" value="advanced" />
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
129 <param name="windowSize" value="10" />
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
130 <param name="mismatchFraction" value="0.15" />
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
131 <param name="minReadsAtLocus" value="4" />
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
132 <param name="maxIntervalSize" value="500" />
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
133 <output name="output_interval" file="gatk/gatk_realigner_target_creator/gatk_realigner_target_creator_out_1.gatk_interval" />
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
134 <output name="output_log" file="gatk/gatk_realigner_target_creator/gatk_realigner_target_creator_out_1.log.contains" compare="contains"/>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
135 </test>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
136 </tests>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
137 <help>
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
138 **What it does**
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
139
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
140 Emits intervals for the Local Indel Realigner to target for cleaning. Ignores 454 reads, MQ0 reads, and reads with consecutive indel operators in the CIGAR string.
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
141
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
142 For more information on local realignment around indels using the GATK, see this `tool specific page &lt;http://www.broadinstitute.org/gatk/gatkdocs/org_broadinstitute_sting_gatk_walkers_indels_RealignerTargetCreator.html&gt;`_.
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
143
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
144 To learn about best practices for variant detection using GATK, see this `overview &lt;http://www.broadinstitute.org/gatk/guide/topic?name=best-practices&gt;`_.
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
145
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
146 If you encounter errors, please view the `GATK FAQ &lt;http://www.broadinstitute.org/gatk/guide/topic?name=faqs&gt;`_.
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
147
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
148 ------
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
149
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
150 **Inputs**
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
151
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
152 GenomeAnalysisTK: RealignerTargetCreator accepts an aligned BAM input file and, optionally, one or more VCF files of known variants.
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
153
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
154
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
155 **Outputs**
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
156
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
157 The interval output is in GATK Interval format. A plain-text log of the run is produced as a second output.
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
158
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
159
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
160 Go `here &lt;http://www.broadinstitute.org/gatk/guide/topic?name=intro&gt;`_ for details on GATK file formats.
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
161
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
162 -------
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
163
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
164 **Settings**::
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
165
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
166 windowSize window size for calculating entropy or SNP clusters
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
167 mismatchFraction fraction of base qualities needing to mismatch for a position to have high entropy; to disable set to &lt;= 0 or &gt; 1
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
168 minReadsAtLocus minimum reads at a locus to enable using the entropy calculation
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
169 maxIntervalSize maximum interval size
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
170
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
171 @CITATION_SECTION@
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
172 </help>
6
b80301676614 Uploaded
iuc
parents: 2
diff changeset
173 <expand macro="citations" />
0
9ad15075b9fa Uploaded
iuc
parents:
diff changeset
174 </tool>