annotate variant_combine.xml @ 0:931e358ece8d draft default tip

Imported from capsule None
author devteam
date Tue, 01 Apr 2014 09:12:26 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
1 <tool id="gatk_variant_combine" name="Combine Variants" version="0.0.4">
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
2 <description></description>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
3 <requirements>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
4 <requirement type="package" version="1.4">gatk</requirement>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
5 </requirements>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
6 <macros>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
7 <import>gatk_macros.xml</import>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
8 </macros>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
9 <command interpreter="python">gatk_wrapper.py
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
10 --max_jvm_heap_fraction "1"
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
11 --stdout "${output_log}"
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
12
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
13 #set $priority_order = []
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
14 #for $input_variant in $reference_source.input_variants:
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
15 -d "--variant:${input_variant.input_variant_name},%(file_type)s" "${input_variant.input_variant}" "${input_variant.input_variant.ext}" "input_variant_${input_variant.input_variant_name}"
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
16 #set $input_variant_name = str( $input_variant.input_variant_name )
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
17 #assert $input_variant_name not in $priority_order, "Variant Names must be unique" ##this should be handled by a validator
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
18 #silent $priority_order.append( $input_variant_name )
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
19 #end for
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
20 -p 'java
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
21 -jar "\$JAVA_JAR_PATH/GenomeAnalysisTK.jar"
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
22 -T "CombineVariants"
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
23 --out "${output_variants}"
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
24 ##--num_threads 4 ##hard coded, for now
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
25 -et "NO_ET" ##ET no phone home
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
26 ##-log "${output_log}" ##don't use this to log to file, instead directly capture stdout
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
27 #if $reference_source.reference_source_selector != "history":
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
28 -R "${reference_source.ref_file.fields.path}"
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
29 #end if
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
30 --genotypemergeoption "${genotype_merge_option}"
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
31 --rod_priority_list "${ ','.join( $priority_order ) }"
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
32 '
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
33
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
34 #include source=$standard_gatk_options#
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
35
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
36
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
37 ##start analysis specific options
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
38 #if $analysis_param_type.analysis_param_type_selector == "advanced":
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
39 -p '
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
40 --filteredrecordsmergetype "${analysis_param_type.filtered_records_merge_type}"
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
41 ${analysis_param_type.print_complex_merges}
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
42 ${analysis_param_type.filtered_are_uncalled}
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
43 ${analysis_param_type.minimal_vcf}
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
44 ${analysis_param_type.assume_identical_samples}
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
45
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
46 #if str( $analysis_param_type.set_key ):
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
47 --setKey "${analysis_param_type.set_key}"
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
48 #end if
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
49
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
50 --minimumN "${analysis_param_type.minimum_n}"
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
51 '
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
52 #end if
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
53 </command>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
54 <inputs>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
55
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
56 <conditional name="reference_source">
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
57 <expand macro="reference_source_selector_param" />
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
58 <when value="cached">
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
59 <repeat min="1" name="input_variants" title="Variants to Merge" help="Records will be prioritized in the order that you list them here (-V,--variant &amp;lt;variant&amp;gt;)">
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
60 <param name="input_variant" type="data" format="vcf" label="Input variant file" />
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
61 <param name="input_variant_name" type="text" value="" label="Variant name" help="Names must be unique">
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
62 <validator type="length" min="1" message="You must provide a unique name for this set of variants" />
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
63 </param>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
64 </repeat>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
65 <param name="ref_file" type="select" label="Using reference genome" help="-R,--reference_sequence &amp;lt;reference_sequence&amp;gt;">
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
66 <options from_data_table="gatk_picard_indexes">
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
67 <!-- <filter type="data_meta" key="dbkey" ref="input_variants.input_variant" column="dbkey"/> -->
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
68 </options>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
69 <validator type="no_options" message="A built-in reference genome is not available for the build associated with the selected input file"/>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
70 </param>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
71 </when>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
72 <when value="history"> <!-- FIX ME!!!! -->
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
73 <repeat min="1" name="input_variants" title="Variants to Merge" help="Records will be prioritized in the order that you list them here (-V,--variant &amp;lt;variant&amp;gt;)">
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
74 <param name="input_variant" type="data" format="vcf" label="Input variant file" />
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
75 <param name="input_variant_name" type="text" value="" label="Variant name" help="Names must be unique">
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
76 <validator type="length" min="1" message="You must provide a unique name for this set of variants" />
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
77 </param>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
78 </repeat>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
79 <param name="ref_file" type="data" format="fasta" label="Using reference file" help="-R,--reference_sequence &amp;lt;reference_sequence&amp;gt;" />
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
80 </when>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
81 </conditional>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
82
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
83 <param name="genotype_merge_option" type="select" label="How should we merge genotype records across records for samples shared across the ROD files" help="-genotypeMergeOptions,--genotypemergeoption &amp;lt;genotypemergeoption&amp;gt;" >
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
84 <option value="UNIQUIFY" />
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
85 <option value="PRIORITIZE" selected="true"/>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
86 <option value="UNSORTED" />
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
87 <option value="REQUIRE_UNIQUE" />
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
88 </param>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
89
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
90 <expand macro="gatk_param_type_conditional" />
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
91
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
92
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
93 <expand macro="analysis_type_conditional">
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
94 <param name="filtered_records_merge_type" type="select" label="How should we deal with records seen at the same site in the VCF, but with different FILTER fields?" help="-filteredRecordsMergeType,--filteredrecordsmergetype &amp;lt;filteredrecordsmergetype&amp;gt;" >
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
95 <option value="KEEP_IF_ANY_UNFILTERED" selected="true"/>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
96 <option value="KEEP_IF_ALL_UNFILTERED" />
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
97 </param>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
98
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
99 <param name="print_complex_merges" checked="false" type="boolean" truevalue="--printComplexMerges" falsevalue="" label="Print out interesting sites requiring complex compatibility merging" help="-printComplexMerges,--printComplexMerges" />
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
100 <param name="filtered_are_uncalled" checked="false" type="boolean" truevalue="--filteredAreUncalled" falsevalue="" label="If true, then filtered VCFs are treated as uncalled, so that filtered set annotation don't appear in the combined VCF" help="-filteredAreUncalled,--filteredAreUncalled" />
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
101 <param name="minimal_vcf" checked="false" type="boolean" truevalue="--minimalVCF" falsevalue="" label="If true, then the output VCF will contain no INFO or genotype INFO field" help="-minimalVCF,--minimalVCF" />
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
102
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
103 <param name="set_key" type="text" value="" label="Key, by default set, in the INFO key=value tag emitted describing which set the combined VCF record came from." help="-setKey,--setKey &amp;lt;setKey&amp;gt;"/>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
104 <param name="assume_identical_samples" checked="false" type="boolean" truevalue="--assumeIdenticalSamples" falsevalue="" label="If true, assume input VCFs have identical sample sets and disjoint calls so that one can simply perform a merge sort to combine the VCFs into one, drastically reducing the runtime." help="-assumeIdenticalSamples,--assumeIdenticalSamples" />
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
105 <param name="minimum_n" type="integer" value="1" label="Combine variants and output site only if variant is present in at least N input files." help="-minN,--minimumN &amp;lt;minimumN&amp;gt;"/>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
106
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
107 </expand>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
108
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
109
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
110 </inputs>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
111 <outputs>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
112 <data format="vcf" name="output_variants" label="${tool.name} on ${on_string} (variants)" />
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
113 <data format="txt" name="output_log" label="${tool.name} on ${on_string} (log)" />
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
114 </outputs>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
115 <tests>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
116 <test>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
117 <param name="reference_source_selector" value="history" />
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
118 <param name="ref_file" value="phiX.fasta" ftype="fasta" />
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
119 <param name="input_variant" value="gatk/gatk_variant_annotator/gatk_variant_annotator_out_1.vcf" ftype="vcf" />
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
120 <param name="input_variant_name" value="from_variant_annotator" />
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
121 <param name="genotype_merge_option" value="PRIORITIZE" />
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
122 <param name="gatk_param_type_selector" value="basic" />
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
123 <param name="analysis_param_type_selector" value="basic" />
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
124 <output name="output_variants" file="gatk/gatk_variant_combine/gatk_variant_combine_out_1.vcf" lines_diff="4" />
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
125 <output name="output_log" file="gatk/gatk_variant_combine/gatk_variant_combine_out_1.log.contains" compare="contains" />
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
126 </test>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
127 </tests>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
128 <help>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
129 **What it does**
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
130
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
131 Combines VCF records from different sources; supports both full merges and set unions. Merge: combines multiple records into a single one; if sample names overlap then they are uniquified. Union: assumes each rod represents the same set of samples (although this is not enforced); using the priority list (if provided), emits a single record instance at every position represented in the rods.
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
132
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
133 For more information on using the CombineVariants module, see this `tool specific page &lt;http://www.broadinstitute.org/gsa/wiki/index.php/CombineVariants&gt;`_.
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
134
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
135 To learn about best practices for variant detection using GATK, see this `overview &lt;http://www.broadinstitute.org/gsa/wiki/index.php/Best_Practice_Variant_Detection_with_the_GATK_v3&gt;`_.
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
136
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
137 If you encounter errors, please view the `GATK FAQ &lt;http://www.broadinstitute.org/gsa/wiki/index.php/Frequently_Asked_Questions&gt;`_.
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
138
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
139 ------
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
140
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
141 **Inputs**
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
142
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
143 GenomeAnalysisTK: CombineVariants accepts variant files as input.
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
144
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
145 ------
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
146
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
147 **Outputs**
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
148
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
149 The output is a combined VCF file.
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
150
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
151
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
152 Go `here &lt;http://www.broadinstitute.org/gsa/wiki/index.php/Input_files_for_the_GATK&gt;`_ for details on GATK file formats.
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
153
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
154 -------
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
155
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
156 **Settings**::
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
157
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
158 out File to which variants should be written
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
159 genotypemergeoption How should we merge genotype records for samples shared across the ROD files? (UNIQUIFY|PRIORITIZE|UNSORTED|REQUIRE_UNIQUE)
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
160 filteredrecordsmergetype How should we deal with records seen at the same site in the VCF, but with different FILTER fields? KEEP_IF_ANY_UNFILTERED PASSes the record if any record is unfiltered, KEEP_IF_ALL_UNFILTERED requires all records to be unfiltered (KEEP_IF_ANY_UNFILTERED|KEEP_IF_ALL_UNFILTERED)
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
161 rod_priority_list When taking the union of variants containing genotypes: a comma-separated string describing the priority ordering for the genotypes as far as which record gets emitted; a complete priority list MUST be provided
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
162 printComplexMerges Print out interesting sites requiring complex compatibility merging
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
163 filteredAreUncalled If true, then filtered VCFs are treated as uncalled, so that filtered set annotations don't appear in the combined VCF
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
164 minimalVCF If true, then the output VCF will contain no INFO or genotype INFO field
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
165 setKey Key (default: "set") of the INFO key=value tag that records which set the combined VCF record came from. Set to null if you don't want the set field emitted.
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
166 assumeIdenticalSamples If true, assume input VCFs have identical sample sets and disjoint calls so that one can simply perform a merge sort to combine the VCFs into one, drastically reducing the runtime.
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
167 minimumN Combine variants and output site only if variant is present in at least N input files.
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
168
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
169 @CITATION_SECTION@
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
170 </help>
931e358ece8d Imported from capsule None
devteam
parents:
diff changeset
171 </tool>