Mercurial > repos > iuc > gatk2
annotate variant_select.xml @ 11:0d369d08ad6e draft
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
| author | iuc |
|---|---|
| date | Mon, 04 May 2015 22:47:06 -0400 |
| parents | b80301676614 |
| children | 669a23f1f4b5 |
| rev | line source |
|---|---|
| 6 | 1 <tool id="gatk2_variant_select" name="Select Variants" version="@VERSION@.0"> |
| 0 | 2 <description>from VCF files</description> |
| 3 <macros> | |
| 4 <import>gatk2_macros.xml</import> | |
| 5 </macros> | |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
6 <expand macro="requirements" /> |
|
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
7 <expand macro="version_command" /> |
| 1 | 8 <command interpreter="python"> |
| 9 #from binascii import hexlify | |
| 10 | |
| 11 gatk2_wrapper.py | |
| 0 | 12 --stdout "${output_log}" |
| 13 -d "--variant:variant,%(file_type)s" "${reference_source.input_variant}" "${reference_source.input_variant.ext}" "input_variant" | |
| 14 -p ' | |
| 15 @JAR_PATH@ | |
| 16 -T "SelectVariants" | |
| 17 \$GATK2_SITE_OPTIONS | |
| 18 | |
| 19 @THREADS@ | |
| 20 -o "${output_vcf}" | |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
21 |
| 0 | 22 #if $reference_source.reference_source_selector != "history": |
| 23 -R "${reference_source.ref_file.fields.path}" | |
| 24 #end if | |
| 25 ' | |
| 26 -p ' | |
| 27 #if $input_concordance: | |
| 28 --concordance "${input_concordance}" | |
| 29 #end if | |
| 30 #if $input_discordance: | |
| 31 --discordance "${input_discordance}" | |
| 32 #end if | |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
33 |
| 0 | 34 #for $exclude_sample_name in $exclude_sample_name_repeat: |
| 35 --exclude_sample_name "${exclude_sample_name.exclude_sample_name}" | |
| 36 #end for | |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
37 |
| 0 | 38 ${exclude_filtered} |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
39 |
| 0 | 40 #for $sample_name in $sample_name_repeat: |
| 41 --sample_name "${sample_name.sample_name}" | |
| 42 #end for | |
| 43 ' | |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
44 |
| 0 | 45 #for $select_expressions in $select_expressions_repeat: |
| 46 #set $select_expression = "--select_expressions '%s'" % ( str( $select_expressions.select_expressions ) ) | |
| 47 -o '${ hexlify( $select_expression ) }' | |
| 48 #end for | |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
49 |
| 0 | 50 ##start tool specific options |
| 51 #if str( $analysis_param_type.analysis_param_type_selector ) == 'advanced': | |
| 52 -p ' | |
| 53 #for $exclude_sample_file in $analysis_param_type.exclude_sample_file_repeat: | |
| 54 --exclude_sample_file "${exclude_sample_file.exclude_sample_file}" | |
| 55 #end for | |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
56 |
| 0 | 57 #for $sample_file in $analysis_param_type.sample_file_repeat: |
| 58 --sample_file "${sample_file.sample_file}" | |
| 59 #end for | |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
60 |
| 0 | 61 #if $analysis_param_type.input_keep_ids: |
| 62 --keepIDs "${analysis_param_type.input_keep_ids}" | |
| 63 #end if | |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
64 |
| 0 | 65 ${analysis_param_type.keep_original_AC} |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
66 |
| 0 | 67 ${analysis_param_type.mendelian_violation} |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
68 |
| 0 | 69 --mendelianViolationQualThreshold "${analysis_param_type.mendelian_violation_qual_threshold}" |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
70 |
| 0 | 71 --remove_fraction_genotypes "${analysis_param_type.remove_fraction_genotypes}" |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
72 |
| 0 | 73 --restrictAllelesTo "${analysis_param_type.restrict_alleles_to}" |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
74 |
| 0 | 75 #if str( $analysis_param_type.select_random_type.select_random_type_selector ) == 'select_random_fraction': |
| 76 --select_random_fraction "${analysis_param_type.select_random_type.select_random_fraction}" | |
| 77 #elif str( $analysis_param_type.select_random_type.select_random_type_selector ) == 'select_random_number': | |
| 78 --select_random_number "${analysis_param_type.select_random_type.select_random_number}" | |
| 79 #end if | |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
80 |
| 0 | 81 #if $analysis_param_type.select_type_to_include: |
| 82 #for $type_to_include in str( $analysis_param_type.select_type_to_include ).split( ',' ): | |
| 83 --selectTypeToInclude "${type_to_include}" | |
| 84 #end for | |
| 85 #end if | |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
86 |
| 0 | 87 ${analysis_param_type.exclude_non_variants} |
| 88 ' | |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
89 |
| 0 | 90 #for $sample_expressions in $analysis_param_type.sample_expressions_repeat: |
| 91 #set $sample_expression = "--sample_expressions '%s'" % ( str( $sample_expressions.sample_expressions ) ) | |
| 92 -o '${ hexlify( $sample_expression ) }' | |
| 93 #end for | |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
94 |
| 0 | 95 #end if |
| 96 ##end tool specific options | |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
97 |
| 0 | 98 #include source=$standard_gatk_options# |
| 99 </command> | |
| 100 <inputs> | |
| 101 <conditional name="reference_source"> | |
| 102 <expand macro="reference_source_selector_param" /> | |
| 103 <when value="cached"> | |
| 104 <param name="input_variant" type="data" format="vcf" label="Variant file to select" help="-V,--variant &lt;variant&gt;" /> | |
| 105 <param name="ref_file" type="select" label="Using reference genome" help="-R,--reference_sequence &lt;reference_sequence&gt;"> | |
| 106 <options from_data_table="gatk2_picard_indexes"> | |
| 107 <filter type="data_meta" key="dbkey" ref="input_variant" column="dbkey"/> | |
| 108 </options> | |
| 109 <validator type="no_options" message="A built-in reference genome is not available for the build associated with the selected input file"/> | |
| 110 </param> | |
| 111 </when> | |
| 112 <when value="history"> <!-- FIX ME!!!! --> | |
| 113 <param name="input_variant" type="data" format="vcf" label="Variant file to select" help="-V,--variant &lt;variant&gt;" /> | |
| 114 <param name="ref_file" type="data" format="fasta" label="Using reference file" help="-R,--reference_sequence &lt;reference_sequence&gt;" /> | |
| 115 </when> | |
| 116 </conditional> | |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
117 |
| 0 | 118 <repeat name="select_expressions_repeat" title="Criteria to use when selecting the data" help="-select,--select_expressions &lt;select_expressions&gt;"> |
| 119 <param name="select_expressions" type="text" label="JEXL expression"> | |
| 120 <sanitizer> | |
| 121 <valid initial="string.printable"> | |
| 122 <remove value="'"/> | |
| 123 </valid> | |
| 124 <mapping initial="none"/> | |
| 125 </sanitizer> | |
| 126 </param> | |
| 127 </repeat> | |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
128 |
| 0 | 129 <param name="input_concordance" type="data" format="vcf" label="Output variants that were also called in this comparison track" optional="True" help="-conc,--concordance &lt;concordance&gt;"/> |
| 130 <param name="input_discordance" type="data" format="vcf" label="Output variants that were not called in this comparison track" optional="True" help="-disc,--discordance &lt;discordance&gt;"/> | |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
131 |
| 0 | 132 <repeat name="sample_name_repeat" title="Include Samples by name" help="-sn,--sample_name &lt;sample_name&gt;"> |
| 133 <param name="sample_name" type="text" label="Include genotypes from this sample"/> | |
| 134 </repeat> | |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
135 |
| 0 | 136 <repeat name="exclude_sample_name_repeat" title="Exclude Samples by name" help="-xl_sn,--exclude_sample_name &lt;exclude_sample_name&gt;"> |
| 137 <param name="exclude_sample_name" type="text" label="Exclude genotypes from this sample"/> | |
| 138 </repeat> | |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
139 |
| 0 | 140 <param name="exclude_filtered" type="boolean" truevalue="--excludeFiltered" falsevalue="" label="Don't include filtered loci in the analysis" help="-ef,--excludeFiltered" /> |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
141 |
| 0 | 142 <expand macro="gatk_param_type_conditional" /> |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
143 |
| 0 | 144 <expand macro="analysis_type_conditional"> |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
145 |
| 0 | 146 <repeat name="exclude_sample_file_repeat" title="Exclude Samples by file" help="-xl_sf,--exclude_sample_file &lt;exclude_sample_file&gt;"> |
| 147 <param name="exclude_sample_file" type="data" format="txt" label="File containing a list of samples (one per line) to exclude"/> | |
| 148 </repeat> | |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
149 |
| 0 | 150 <repeat name="sample_file_repeat" title="Samples by file" help="-sf,--sample_file &lt;sample_file&gt;"> |
| 151 <param name="sample_file" type="data" format="txt" label="File containing a list of samples (one per line) to include" /> | |
| 152 </repeat> | |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
153 |
| 0 | 154 <param name="input_keep_ids" type="data" format="txt" label="Only emit sites whose ID is found in this file" optional="True" help="-IDs,--keepIDs &lt;keepIDs&gt;"/> <!-- format is "txt", matching the other plain-text list inputs in this tool --> |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
155 |
| 0 | 156 <param name="keep_original_AC" type="boolean" truevalue="--keepOriginalAC" falsevalue="" label="Don't update the AC, AF, or AN values in the INFO field after selecting" help="-keepOriginalAC,--keepOriginalAC" /> |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
157 |
| 0 | 158 <param name="mendelian_violation" type="boolean" truevalue="--mendelianViolation" falsevalue="" label="output mendelian violation sites only" help="-mv,--mendelianViolation" /> |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
159 |
| 0 | 160 <param name="mendelian_violation_qual_threshold" type="float" label="Minimum genotype QUAL score for each trio member required to accept a site as a mendelian violation" value="0" help="-mvq,--mendelianViolationQualThreshold &lt;mendelianViolationQualThreshold&gt;" /> |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
161 |
| 0 | 162 <param name="remove_fraction_genotypes" type="float" label="Selects a fraction (a number between 0 and 1) of the total genotypes at random from the variant track and sets them to nocall" value="0" min="0" max="1" help="-fractionGenotypes,--remove_fraction_genotypes &lt;remove_fraction_genotypes&gt;" /> |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
163 |
| 0 | 164 <param name="restrict_alleles_to" type="select" label="Select only variants of a particular allelicity" help="-restrictAllelesTo,--restrictAllelesTo &lt;restrictAllelesTo&gt;"> |
| 165 <option value="ALL" selected="True">ALL</option> | |
| 166 <option value="MULTIALLELIC">MULTIALLELIC</option> | |
| 167 <option value="BIALLELIC">BIALLELIC</option> | |
| 168 </param> | |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
169 |
| 0 | 170 <repeat name="sample_expressions_repeat" title="Regular expression to select many samples from the ROD tracks provided" help="-se,--sample_expressions &lt;sample_expressions&gt;"> |
| 171 <param name="sample_expressions" type="text" label="Regular expression"> | |
| 172 <sanitizer> | |
| 173 <valid initial="string.printable"> | |
| 174 <remove value="'"/> | |
| 175 </valid> | |
| 176 <mapping initial="none"/> | |
| 177 </sanitizer> | |
| 178 </param> | |
| 179 </repeat> | |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
180 |
| 0 | 181 <conditional name="select_random_type"> |
| 182 <param name="select_random_type_selector" type="select" label="Select a random subset of variants"> | |
| 183 <option value="select_all" selected="True">Use all variants</option> | |
| 184 <option value="select_random_fraction">Select random fraction</option> | |
| 185 <option value="select_random_number">Select random number</option> | |
| 186 </param> | |
| 187 <when value="select_all"> | |
| 188 <!-- Do nothing here --> | |
| 189 </when> | |
| 190 <when value="select_random_fraction"> | |
| 191 <param name="select_random_fraction" type="float" value="0" label="Fraction" min="0" max="1" help="-fraction,--select_random_fraction &lt;select_random_fraction&gt;"/> | |
| 192 </when> | |
| 193 <when value="select_random_number"> | |
| 194 <param name="select_random_number" type="integer" value="0" label="Count" help="-number,--select_random_number &lt;select_random_number&gt;" /> | |
| 195 </when> | |
| 196 </conditional> | |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
197 |
| 0 | 198 <param name="exclude_non_variants" type="boolean" truevalue="--excludeNonVariants" falsevalue="" label="Don't include loci found to be non-variant after the subsetting procedure" help="-env,--excludeNonVariants" /> |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
199 |
| 0 | 200 <param name="select_type_to_include" type="select" label="Select only a certain type of variants from the input file" multiple="True" display="checkboxes" help="-selectType,--selectTypeToInclude &lt;selectTypeToInclude&gt;"> |
| 201 <option value="INDEL">INDEL</option> | |
| 202 <option value="SNP">SNP</option> | |
| 203 <option value="MIXED">MIXED</option> | |
| 204 <option value="MNP">MNP</option> | |
| 205 <option value="SYMBOLIC">SYMBOLIC</option> | |
| 206 <option value="NO_VARIATION">NO_VARIATION</option> | |
| 207 </param> | |
| 208 </expand> | |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
209 |
| 0 | 210 </inputs> |
| 211 <outputs> | |
| 212 <data format="vcf" name="output_vcf" label="${tool.name} on ${on_string} (Variant File)" /> | |
| 213 <data format="txt" name="output_log" label="${tool.name} on ${on_string} (log)" /> | |
| 214 </outputs> | |
| 215 <tests> | |
| 216 <test> | |
| 217 <param name="reference_source_selector" value="history" /> | |
| 218 <param name="ref_file" value="phiX.fasta" ftype="fasta" /> | |
| 219 <param name="input_variant" value="gatk/gatk_variant_annotator/gatk_variant_annotator_out_1.vcf" ftype="vcf" /> | |
| 220 <param name="select_expressions_repeat" value="0" /> | |
| 221 <param name="input_concordance" /> | |
| 222 <param name="input_discordance" /> | |
| 223 <param name="exclude_sample_name_repeat" value="0" /> | |
| 224 <param name="exclude_filtered" /> | |
| 225 <param name="sample_name_repeat" value="0" /> | |
| 226 <param name="gatk_param_type_selector" value="basic" /> | |
| 227 <param name="analysis_param_type_selector" value="basic" /> | |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
228 <output name="output_vcf" file="gatk/gatk_variant_select/gatk_variant_select_out_1.vcf" lines_diff="4" /> |
| 0 | 229 <output name="output_log" file="gatk/gatk_variant_select/gatk_variant_select_out_1.log.contains" compare="contains" /> |
| 230 </test> | |
| 231 </tests> | |
| 232 <help> | |
| 233 **What it does** | |
| 234 | |
|
11
0d369d08ad6e
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk2 commit 344140b8df53b8b7024618bb04594607a045c03a
iuc
parents:
6
diff
changeset
|
235 Often, a VCF containing many samples and/or variants will need to be subset in order to facilitate certain analyses (e.g. comparing and contrasting cases vs. controls; extracting variant or non-variant loci that meet certain requirements; displaying just a few samples in a browser like IGV, etc.). SelectVariants can be used for this purpose. Given a single VCF file, one or more samples can be extracted from the file (based on a complete sample name or a pattern match). Variants can be further selected by specifying criteria for inclusion, e.g. "DP > 1000" (depth of coverage greater than 1000x), "AF < 0.25" (sites with allele frequency less than 0.25). These JEXL expressions are documented in the `Using JEXL expressions section <http://gatkforums.broadinstitute.org/discussion/1255/what-are-jexl-expressions-and-how-can-i-use-them-with-the-gatk>`_. One can optionally include concordance or discordance tracks for use in selecting overlapping variants. |
| 0 | 236 |
| 237 For more information on using the SelectVariants module, see this `tool specific page <http://www.broadinstitute.org/gatk/gatkdocs/org_broadinstitute_sting_gatk_walkers_variantutils_SelectVariants.html>`_. | |
| 238 | |
| 239 To learn about best practices for variant detection using GATK, see this `overview <http://www.broadinstitute.org/gatk/guide/topic?name=best-practices>`_. | |
| 240 | |
| 241 If you encounter errors, please view the `GATK FAQ <http://www.broadinstitute.org/gatk/guide/topic?name=faqs>`_. | |
| 242 | |
| 243 ------ | |
| 244 | |
| 245 **Inputs** | |
| 246 | |
| 247 GenomeAnalysisTK: SelectVariants accepts a VCF input file. | |
| 248 | |
| 249 | |
| 250 **Outputs** | |
| 251 | |
| 252 The output is in VCF format. | |
| 253 | |
| 254 | |
| 255 Go `here <http://www.broadinstitute.org/gatk/guide/topic?name=intro>`_ for details on GATK file formats. | |
| 256 | |
| 257 ------- | |
| 258 | |
| 259 **Settings**:: | |
| 260 | |
| 261 | |
| 262 out VCFWriter stdout File to which variants should be written | |
| 263 variant RodBinding[VariantContext] NA Input VCF file | |
| 264 concordance RodBinding[VariantContext] none Output variants that were also called in this comparison track | |
| 265 discordance RodBinding[VariantContext] none Output variants that were not called in this comparison track | |
| 266 exclude_sample_file Set[File] [] File containing a list of samples (one per line) to exclude. Can be specified multiple times | |
| 267 exclude_sample_name Set[String] [] Exclude genotypes from this sample. Can be specified multiple times | |
| 268 excludeFiltered boolean false Don't include filtered loci in the analysis | |
| 269 excludeNonVariants boolean false Don't include loci found to be non-variant after the subsetting procedure | |
| 270 keepIDs File NA Only emit sites whose ID is found in this file (one ID per line) | |
| 271 keepOriginalAC boolean false Don't update the AC, AF, or AN values in the INFO field after selecting | |
| 272 mendelianViolation Boolean false output mendelian violation sites only | |
| 273 mvq double 0.0 Minimum genotype QUAL score for each trio member required to accept a site as a violation | |
| 274 remove_fraction_genotypes double 0.0 Selects a fraction (a number between 0 and 1) of the total genotypes at random from the variant track and sets them to nocall | |
| 275 restrictAllelesTo NumberAlleleRestriction ALL Select only variants of a particular allelicity. Valid options are ALL (default), MULTIALLELIC or BIALLELIC | |
| 276 sample_expressions Set[String] NA Regular expression to select many samples from the ROD tracks provided. Can be specified multiple times | |
| 277 sample_file Set[File] NA File containing a list of samples (one per line) to include. Can be specified multiple times | |
| 278 sample_name Set[String] [] Include genotypes from this sample. Can be specified multiple times | |
| 279 select_expressions ArrayList[String] [] One or more criteria to use when selecting the data | |
| 280 select_random_fraction double 0.0 Selects a fraction (a number between 0 and 1) of the total variants at random from the variant track | |
| 281 select_random_number int 0 Selects a number of variants at random from the variant track | |
| 282 selectTypeToInclude List[Type] [] Select only a certain type of variants from the input file. Valid types are INDEL, SNP, MIXED, MNP, SYMBOLIC, NO_VARIATION. Can be specified multiple times | |
| 283 | |
| 284 @CITATION_SECTION@ | |
| 285 </help> | |
| 6 | 286 <expand macro="citations" /> |
| 0 | 287 </tool> |
