view testing_cgatools-982e19c29ec0/cgatools/tools/cgatools_1.6/mkvcf.xml @ 0:ef23f9cd599b draft default tip

Uploaded
author devteam
date Thu, 27 Sep 2012 13:37:59 -0400
parents
children
line wrap: on
line source

<tool id="cg_mkvcf" name="mkvcf(beta) 1.6" version="1.0.0">
<!--
This tool creates a GUI for the mkvcf function of cgatools from Complete Genomics, Inc.
written 7-31-2012 by bcrain@completegenomics.com
-->

  <description>converts to vcf</description>

  <command interpreter="perl">
  	<!--run wrapper script-->
  	mkvcf_wrapper.pl
  	--reference $crr.fields.path
  	--output $output
  	--genomes $count.genomes
		--source $count.sources.source
		--datasource $count.sources.data_sources.data_source
		#if $count.sources.data_sources.data_source=="in"
			#for $m in $count.sources.data_sources.files
				--input $m.input
			#end for
		#else
			--input $count.sources.data_sources.input
		#end if
		#if $count.sources.source=="masterVar" or $count.sources.source=="masterVar,CNV"
	  	$count.sources.nocalls
	  	--calibration $count.sources.calibration
	  #else if $count.sources.source=="SV"
			--jctscore $count.sources.jctscore
			--jctside $count.sources.jctside
			--jctdistance $count.sources.jctdistance
			--jctlength $count.sources.jctlength
			$count.sources.jctpriority
			$count.sources.jcttumor
	  #else if $count.sources.source=="masterVar,CNV,SV" or $count.sources.source=="masterVar,CNV,SV,MEI"
	  	$count.sources.nocalls
	  	--calibration $count.sources.calibration
			--jctscore $count.sources.jctscore
			--jctside $count.sources.jctside
			--jctdistance $count.sources.jctdistance
			--jctlength $count.sources.jctlength
			$count.sources.jctpriority
			$count.sources.jcttumor
	  #end if
	  	--fields $count.sources.fields
  </command>

  <outputs>
    <data format="vcf" name="output" label="${tool.name} output"/>
  </outputs>
  
  <inputs>
  	<!--form field to select crr file-->
    <param name="crr" type="select" label="Reference genome (.crr file)">
      <options from_data_table="cg_crr_files" />
    </param>
    
    <!--select number of genomes - determines which input sources to show-->
    <conditional name="count">
    	<param name="genomes" type="select" label="Select the number of genomes to add to the vcf file" help="Note: multi-genome vcfs (2 or more genomes) can only be generated for format version 2.0 and up">
				<option value="1" selected="true">1 - allowed data sources are masterVar, CNV, SV, MEI</option>
				<option value="2">2 - allowed data sources are masterVar, CNV, SV (format v2.x)</option>
				<option value="3">3 or more - allowed data sources are masterVar, CNV (format v2.x)</option>
			</param>
    	
			<when value="1">
				<!--form field to select input sources-->
				<conditional name="sources">
					<param name="source" type="select" label="Data sources to be included for this genome">
						<option value="masterVar,CNV,SV,MEI" selected="true">masterVar + CNV + SV + MEI</option>
						<option value="masterVar">masterVar</option>
						<option value="CNV">CNV</option>
						<option value="SV">SV</option>
						<option value="MEI">MEI</option>
					</param>
					
					<when value="masterVar,CNV,SV,MEI">
						<!--conditional to select inputs-->
						<conditional name="data_sources">
							<param name="data_source" type="select" label="Where are the input files?">
								<option value="out" selected="true">located outside Galaxy (data on server or mounted drive)</option>
							</param>
							
							<when value="out">
								<!--form field to enter input file-->
								<param name="input" type="text" label="Genome root directory" size="200" help="Enter full path /path/dir (e.g. /harddrive/GS00000XXXX-DID/GS00000YYYY-ASM/GS00123-DNA_G01).">
									<validator type="empty_field" message="You must supply the genome root directory"/>
								</param>
							</when>
						</conditional>
					
						<!--form field to select no-calls-->
						<param name="nocalls" type="select" label="Include no-calls?">
							<option value="" selected="true">no</option>
							<option value="--nocalls">yes</option>
						</param>

						<!--form field to enter calibration directory-->
						<param name="calibration" type="text" size="300" label="Directory calibration data (/path/calibration-root)" help="The directory containing calibration data. For example, there should exist a file calibration-root/0.0.0/metrics.tsv. Calibration data can be downloaded from ftp://ftp.completegenomics.com/ScoreCalibrationFiles/var-calibration-v2.tgz"/>
						
						<!--form fields junction threshold options-->
						<param name="jctscore" type="integer" value="10" label="Junction score thresholds (discordant mate pair count) (default 10)">
							<validator type="empty_field" message="You must enter a value, for the default value enter 10" />
						</param>
						<param name="jctside" type="integer" value="70" label="Junction side length threshold (default 70)">
							<validator type="empty_field" message="You must enter a value, for the default value enter 70" />
						</param>
						<param name="jctdistance" type="integer" value="200" label="Distance tolerance for junction compatibility (default 200)">
							<validator type="empty_field" message="You must enter a value, for the default value enter 200" />
						</param>
						<param name="jctlength" type="integer" value="500" label="Length threshold for compatible junctions (default 500)">
							<validator type="empty_field" message="You must enter a value, for the default value enter 500" />
						</param>
				
						<!--form field to select junction confidence in tumors-->
						<param name="jctpriority" type="select" label="Use normal junction priority for vcf output?">
							<option value="" selected="true">no</option>
							<option value="--jctpriority">yes</option>
						</param>
				 
						<!--form field to select junction confidence in tumors-->
						<param name="jcttumor" type="select" label="Use high confidence junctions for tumors?">
							<option value="" selected="true">no</option>
							<option value="--jcttumor">yes</option>
						</param>

						<!--form field to select field names to include in vcf-->
						<param name="fields" type="select" label="Field names to be included in vcf file" multiple="true" help="Select all field names (default) or a collection of individual field names.">
							<option value="all" selected="true">-- all (default) --</option>
							<option value="NS">NS - Number of samples</option>
							<option value="AN">AN - Total number of alleles in called genotypes</option>
							<option value="AC">AC - Allele count in genotypes</option>
							<option value="CGA_XR">CGA_XR - External database reference</option>
							<option value="CGA_FI">CGA_FI - Functional impact</option>
							<option value="CGA_PFAM">CGA_PFAM - PFAM domain </option>
							<option value="CGA_MIRB">CGA_MIRB - miRBaseId</option>
							<option value="CGA_SDO">CGA_SDO - Depth of overlapping segmental duplications</option>
							<option value="CGA_RPT">CGA_RPT - Overlapping repeatMasker annotations</option>
							<option value="GT">GT - Genotype</option>
							<option value="PS">PS - Phase set</option>
							<option value="FT">FT - Sample genotype filters</option>
							<option value="GL">GL - Genotype likelihoods</option>
							<option value="CGA_CEHQ">CGA_CEHQ - Calibrated haplotype quality based on EAF assumption</option>
							<option value="CGA_CEGL">CGA_CEGL - Genotype likelihoods based on CEHQ</option>
							<option value="SS">SS - Somatic status</option>
							<option value="HQ">HQ - Haplotype quality</option>
							<option value="EHQ">EHQ - Haplotype quality based on EAF assumption</option>
							<option value="GQ">GQ - Genotype quality</option>
							<option value="DP">DP - Total read depth</option>
							<option value="AD">AD - Allelic depths</option>
							<option value="CGA_RDP">CGA_RDP - Read depth in reference</option>
							<option value="CGA_ODP">CGA_ODP - Other total read depth: somatic comparison</option>
							<option value="CGA_OAD">CGA_OAD - Other allelic depths: somatic comparison</option>
							<option value="CGA_ORDP">CGA_ORDP - Other reference depth: somatic comparison </option>
							<option value="CGA_SOMC">CGA_SOMC - Somatic Category</option>
							<option value="CGA_SOMR">CGA_SOMR - Somatic Rank</option>
							<option value="CGA_SOMS">CGA_SOMS - Somatic Score</option>
							<option value="CGA_GP">CGA_GP - Normalized mean GC corrected coverage</option>
							<option value="CGA_NP">CGA_NP - Normalized mean coverage for 2k window</option>
							<option value="CGA_CP">CGA_CP - Diploid-model ploidy call for segment including this interval</option>
							<option value="CGA_PS">CGA_PS - Diploid-model called ploidy score</option>
							<option value="CGA_CT">CGA_CT - Diploid-model CNV type</option>
							<option value="CGA_TS">CGA_TS - Diploid-model CNV type score</option>
							<option value="CGA_CL">CGA_CL - Nondiploid-model called level</option>
							<option value="CGA_LS">CGA_LS - Nondiploid-model called level score</option>
							<option value="CGA_SCL">CGA_SCL - Nondiploid-model somatic called level</option>
							<option value="CGA_SLS">CGA_SLS - Non-diploid-model somatic called level score</option>
							<option value="CGA_LAF">CGA_LAF - Lesser Allele Fraction estimate, 100k window</option>
							<option value="CGA_LLAF">CGA_LLAF - Lesser Allele Fraction lower bound, 100k window</option>
							<option value="CGA_ULAF">CGA_ULAF - Lesser Allele Fraction upper bound, 100k window</option>
							<option value="SVTYPE">SVTYPE - Type of structural variation</option>
							<option value="CGA_BF">CGA_BF - Frequency in set of baseline genomes</option>
							<option value="CGA_MEDEL">CGA_MEDEL - Mobile element deletion</option>
							<option value="MATEID">MATEID - ID of mate breakend</option>
							<option value="CGA_BNDG">CGA_BNDG - Transcript name and strand of genes containing breakend</option>
							<option value="CGA_BNDGO">CGA_BNDGO - Transcript name and strand of genes containing mate breakend</option>
							<option value="CGA_BNDP">CGA_BNDP - Precision of breakend</option>
							<option value="CGA_BNDMPC">CGA_BNDMPC - Mate pair count supporting a breakend</option>
							<option value="CGA_BNDPOS">CGA_BNDPOS - Position of breakend as detected in individual genome</option>
							<option value="CGA_BNDDEF">CGA_BNDDEF - Breakend definition in individual genome</option>
							<option value="CGA_IS">CGA_IS - Measure of confidence that there is a mobile element insertion</option>
							<option value="CGA_IDC">CGA_IDC - Count of paired ends consistently indicating a mobile element insertion</option>
							<option value="CGA_IDCL">CGA_IDCL - Count of paired ends indicating a mobile element insertion anchored 5&#39;</option>
							<option value="CGA_IDCR">CGA_IDCR - Count of paired ends indicating a mobile element insertion anchored 3&#39;</option>
							<option value="CGA_RDC">CGA_RDC - Count of paired ends supporting the presence of a reference allele</option>
							<option value="CGA_NBET">CGA_NBET - Next-best estimate of type of MEI</option>
							<option value="CGA_ETS">CGA_ETS - Measure of confidence that the ElementType (MEINFO:NAME) is correct</option>
							<option value="CGA_KES">CGA_KES - Fraction of known MEI with at least as good an InsertionScore</option>
						</param>
					</when>

					<when value="masterVar">
						<!--conditional to select inputs-->
						<conditional name="data_sources">
							<param name="data_source" type="select" label="Where is the input file?">
								<option value="in" selected="true">imported into Galaxy</option>
								<option value="out">located outside Galaxy (data on server or mounted drive)</option>
							</param>
							
							<when value="in">
								<!--form field to select mastervar files-->
								<repeat name="files" title="MasterVar file" min="1" max="1">
									<param name="input" type="data" format="cg_mastervar" label="Dataset">
										<validator type="dataset_ok_validator" />
										<validator type="dataset_metadata_in_file" filename="cg_crr_files.loc"
										 metadata_name="dbkey" metadata_column="1"
										 message="cgatools is not currently available for this build."/>
									</param>
								</repeat>
							</when>
							
							<when value="out">
								<!--form field to enter input file-->
								<param name="input" type="text" label="Genome root directory or masterVar file" size="200" help="Enter full path /path/dir (e.g. /harddrive/GS00000XXXX-DID/GS00000YYYY-ASM/GS00123-DNA_G01), or /path/masterVarfile (e.g. /harddrive/GS00000XXXX-DID/GS00000YYYY-ASM/GS00123-DNA_G01/ASM/masterVarBeta-GS00000YYYY-ASM.tsv.bz2).">
									<validator type="empty_field" message="You must supply the genome root directory or masterVar file"/>
								</param>
							</when>
						</conditional>
									
						<!--form field to select no-calls-->
						<param name="nocalls" type="select" label="Include no-calls?">
							<option value="" selected="true">no</option>
							<option value="--nocalls">yes</option>
						</param>
						
						<!--form field to enter calibration directory-->
						<param name="calibration" type="text" size="300" label="Directory calibration data (/path/calibration-root)" help="The directory containing calibration data. For example, there should exist a file calibration-root/0.0.0/metrics.tsv. Calibration data can be downloaded from ftp://ftp.completegenomics.com/ScoreCalibrationFiles/var-calibration-v2.tgz"/>

						<!--form field to select field names to include in vcf-->
						<param name="fields" type="select" label="Field names to be included in vcf file" multiple="true" help="Select all field names (default) or a collection of individual field names.">
							<option value="all" selected="true">-- all (default) --</option>
							<option value="NS">NS - Number of samples</option>
							<option value="AN">AN - Total number of alleles in called genotypes</option>
							<option value="AC">AC - Allele count in genotypes</option>
							<option value="CGA_XR">CGA_XR - External database reference</option>
							<option value="CGA_FI">CGA_FI - Functional impact</option>
							<option value="CGA_PFAM">CGA_PFAM - PFAM domain </option>
							<option value="CGA_MIRB">CGA_MIRB - miRBaseId</option>
							<option value="CGA_SDO">CGA_SDO - Depth of overlapping segmental duplications</option>
							<option value="CGA_RPT">CGA_RPT - Overlapping repeatMasker annotations</option>
							<option value="GT">GT - Genotype</option>
							<option value="PS">PS - Phase set</option>
							<option value="FT">FT - Sample genotype filters</option>
							<option value="GL">GL - Genotype likelihoods</option>
							<option value="CGA_CEHQ">CGA_CEHQ - Calibrated haplotype quality based on EAF assumption</option>
							<option value="CGA_CEGL">CGA_CEGL - Genotype likelihoods based on CEHQ</option>
							<option value="SS">SS - Somatic status</option>
							<option value="HQ">HQ - Haplotype quality</option>
							<option value="EHQ">EHQ - Haplotype quality based on EAF assumption</option>
							<option value="GQ">GQ - Genotype quality</option>
							<option value="DP">DP - Total read depth</option>
							<option value="AD">AD - Allelic depths</option>
							<option value="CGA_RDP">CGA_RDP - Read depth in reference</option>
							<option value="CGA_ODP">CGA_ODP - Other total read depth: somatic comparison</option>
							<option value="CGA_OAD">CGA_OAD - Other allelic depths: somatic comparison</option>
							<option value="CGA_ORDP">CGA_ORDP - Other reference depth: somatic comparison </option>
							<option value="CGA_SOMC">CGA_SOMC - Somatic Category</option>
							<option value="CGA_SOMR">CGA_SOMR - Somatic Rank</option>
							<option value="CGA_SOMS">CGA_SOMS - Somatic Score</option>
						</param>
					</when>
					
					<when value="CNV">
						<!--conditional to select inputs-->
						<conditional name="data_sources">
							<param name="data_source" type="select" label="Where are the input files?">
								<option value="out" selected="true">located outside Galaxy (data on server or mounted drive)</option>
							</param>
							
							<when value="out">
								<!--form field to enter input file-->
								<param name="input" type="text" label="Genome root directory" size="200" help="Enter full path /path/dir (e.g. /harddrive/GS00000XXXX-DID/GS00000YYYY-ASM/GS00123-DNA_G01).">
									<validator type="empty_field" message="You must supply the genome root directory"/>
								</param>
							</when>
						</conditional>
						
						<!--form field to select field names to include in vcf-->
						<param name="fields" type="select" label="Field names to be included in vcf file" multiple="true" help="Select all field names (default) or a collection of individual field names.">
							<option value="all" selected="true">-- all (default) --</option>
							<option value="GT">GT - Genotype</option>
							<option value="CGA_GP">CGA_GP - Normalized mean GC corrected coverage</option>
							<option value="CGA_NP">CGA_NP - Normalized mean coverage for 2k window</option>
							<option value="CGA_CP">CGA_CP - Diploid-model ploidy call for segment</option>
							<option value="CGA_PS">CGA_PS - Diploid-model called ploidy score</option>
							<option value="CGA_CT">CGA_CT - Diploid-model CNV type</option>
							<option value="CGA_TS">CGA_TS - Diploid-model CNV type score</option>
							<option value="CGA_CL">CGA_CL - Nondiploid-model called level</option>
							<option value="CGA_LS">CGA_LS - Nondiploid-model called level score</option>
							<option value="CGA_SCL">CGA_SCL - Nondiploid-model somatic called level</option>
							<option value="CGA_SLS">CGA_SLS - Non-diploid-model somatic called level score</option>
							<option value="CGA_LAF">CGA_LAF - Lesser Allele Fraction estimate, 100k window</option>
							<option value="CGA_LLAF">CGA_LLAF - Lesser Allele Fraction lower bound, 100k window</option>
							<option value="CGA_ULAF">CGA_ULAF - Lesser Allele Fraction upper bound, 100k window</option>
						</param>
					</when>
					
					<when value="SV">
						<!--conditional to select inputs-->
						<conditional name="data_sources">
							<param name="data_source" type="select" label="Where are the input files?">
								<option value="in" selected="true">imported into Galaxy</option>
								<option value="out">located outside Galaxy (data on server or mounted drive)</option>
							</param>
							
							<when value="in">
								<!--form field to select SV file-->
								<repeat name="files" title="SV file" min="1" max="1">
									<param name="input" type="data" format="tabular" label="Dataset">
										<validator type="dataset_ok_validator" />
										<validator type="dataset_metadata_in_file" filename="cg_crr_files.loc"
										 metadata_name="dbkey" metadata_column="1"
										 message="cgatools is not currently available for this build."/>
									</param>
								</repeat>
							</when>
							
							<when value="out">
								<!--form field to enter input file-->
								<param name="input" type="text" label="Genome root directory or SV file" size="200" help="Enter full path /path/dir (e.g. /harddrive/GS00000XXXX-DID/GS00000YYYY-ASM/GS00123-DNA_G01), or /path/SVfile (e.g. /harddrive/GS00000XXXX-DID/GS00000YYYY-ASM/GS00123-DNA_G01/ASM/SV/allJunctionsBeta-GS00000YYYY-ASM.tsv).">
									<validator type="empty_field" message="You must supply the genome root directory or SV file"/>
								</param>
							</when>
						</conditional>
									
						<!--form fields junction threshold options-->
						<param name="jctscore" type="integer" value="10" label="Junction score thresholds (discordant mate pair count) (default 10)">
							<validator type="empty_field" message="You must enter a value, for the default value enter 10" />
						</param>
						<param name="jctside" type="integer" value="70" label="Junction side length threshold (default 70)">
							<validator type="empty_field" message="You must enter a value, for the default value enter 70" />
						</param>
						<param name="jctdistance" type="integer" value="200" label="Distance tolerance for junction compatibility (default 200)">
							<validator type="empty_field" message="You must enter a value, for the default value enter 200" />
						</param>
						<param name="jctlength" type="integer" value="500" label="Length threshold for compatible junctions (default 500)">
							<validator type="empty_field" message="You must enter a value, for the default value enter 500" />
						</param>
				
						<!--form field to select junction confidence in tumors-->
						<param name="jctpriority" type="select" label="Use normal junction priority for vcf output?">
							<option value="" selected="true">no</option>
							<option value="--jctpriority">yes</option>
						</param>
				 
						<!--form field to select junction confidence in tumors-->
						<param name="jcttumor" type="select" label="Use high confidence junctions for tumors?">
							<option value="" selected="true">no</option>
							<option value="--jcttumor">yes</option>
						</param>

						<!--form field to select field names to include in vcf-->
						<param name="fields" type="select" label="Field names to be included in vcf file" multiple="true" help="Select all field names (default) or a collection of individual field names.">
							<option value="all" selected="true">-- all (default) --</option>
				      <option value="GT">GT - Genotype</option>
				      <option value="FT">FT - Sample genotype filters</option>
							<option value="NS">NS - Number of samples</option>
							<option value="CGA_XR">CGA_XR - External database reference</option>
							<option value="SVTYPE">SVTYPE - Type of structural variation</option>
							<option value="CGA_BF">CGA_BF - Frequency in set of baseline genomes</option>
							<option value="CGA_MEDEL">CGA_MEDEL - Mobile element deletion</option>
							<option value="MATEID">MATEID - ID of mate breakend</option>
							<option value="CGA_BNDG">CGA_BNDG - Transcript name and strand of genes containing breakend</option>
							<option value="CGA_BNDGO">CGA_BNDGO - Transcript name and strand of genes containing mate breakend</option>
							<option value="CGA_BNDP">CGA_BNDP - Precision of breakend</option>
							<option value="CGA_BNDMPC">CGA_BNDMPC - Mate pair count supporting a breakend</option>
							<option value="CGA_BNDPOS">CGA_BNDPOS - Position of breakend as detected in individual genome</option>
							<option value="CGA_BNDDEF">CGA_BNDDEF - Breakend definition in individual genome</option>
						</param>
					</when>
					
					<when value="MEI">
						<!--conditional to select inputs-->
						<conditional name="data_sources">
							<param name="data_source" type="select" label="Where are the input files?">
								<option value="out" selected="true">located outside Galaxy</option>
							</param>
							
							<when value="out">
								<!--form field to select outside list of genome directories or mastervar files-->
								<param name="input" type="text" label="Genome root directory" size="200" help="Enter full path /path/dir (e.g. /harddrive/GS00000XXXX-DID/GS00000YYYY-ASM/GS00123-DNA_G01).">
									<validator type="empty_field" message="You must supply the genome root directory"/>
								</param>
							</when>
						</conditional>
						
						<!--form field to select field names to include in vcf-->
						<param name="fields" type="select" label="Field names to be included in vcf file" multiple="true" help="Select all field names (default) or a collection of individual field names.">
							<option value="all" selected="true">-- all (default) --</option>
				      <option value="GT">GT - Genotype</option>
				      <option value="FT">FT - Sample genotype filters</option>
							<option value="CGA_IS">CGA_IS - Measure of confidence that there is a mobile element insertion</option>
							<option value="CGA_IDC">CGA_IDC - Count of paired ends consistently indicating a mobile element insertion</option>
							<option value="CGA_IDCL">CGA_IDCL - Count of paired ends indicating a mobile element insertion, anchored 5&#39;</option>
							<option value="CGA_IDCR">CGA_IDCR - Count of paired ends indicating a mobile element insertion, anchored 3&#39;</option>
							<option value="CGA_RDC">CGA_RDC - Count of paired ends supporting the presence of a reference allele</option>
							<option value="CGA_NBET">CGA_NBET - Next-best estimate of type of MEI</option>
							<option value="CGA_ETS">CGA_ETS - Measure of confidence that the ElementType (MEINFO:NAME) is correct</option>
							<option value="CGA_KES">CGA_KES - Fraction of known MEI with at least as good an InsertionScore</option>
						</param>
					</when>

				</conditional>
			</when>
			
			<when value="2">
				<!--form field to select input sources-->
				<conditional name="sources">
					<param name="source" type="select" label="Data sources to be included for each genome">
						<option value="masterVar,CNV,SV" selected="true">masterVar + CNV + SV</option>
						<option value="masterVar">masterVar</option>
						<option value="CNV">CNV</option>
						<option value="SV">SV</option>
					</param>

					<when value="masterVar,CNV,SV">
						<!--conditional to select inputs-->
						<conditional name="data_sources">
							<param name="data_source" type="select" label="Where are the input files?">
								<option value="out" selected="true">located outside Galaxy (data on server or mounted drive)</option>
							</param>
							
							<when value="out">
								<!--form field to enter input file-->
								<param name="input" type="text" label="File with list of genome root directories" size="200" help="Enter file name with full path (/path/file). This file should contain a list of genome root directory names, one per line in the format /path/dir (e.g. /harddrive/GS00000XXXX-DID/GS00000YYYY-ASM/GS00123-DNA_G01). For normal/tumor comparisons list the baseline genome first.">
									<validator type="empty_field" message="You must supply the list of genome root directories"/>
								</param>
							</when>
						</conditional>
					
						<!--form field to select no-calls-->
						<param name="nocalls" type="select" label="Include no-calls?">
							<option value="" selected="true">no</option>
							<option value="--nocalls">yes</option>
						</param>
						
						<!--form field to enter calibration directory-->
						<param name="calibration" type="text" size="300" label="Directory calibration data (/path/calibration-root)" help="The directory containing calibration data. For example, there should exist a file calibration-root/0.0.0/metrics.tsv. Calibration data can be downloaded from ftp://ftp.completegenomics.com/ScoreCalibrationFiles/var-calibration-v2.tgz"/>

						<!--form fields junction threshold options-->
						<param name="jctscore" type="integer" value="10" label="Junction score thresholds (discordant mate pair count) (default 10)">
							<validator type="empty_field" message="You must enter a value, for the default value enter 10" />
						</param>
						<param name="jctside" type="integer" value="70" label="Junction side length threshold (default 70)">
							<validator type="empty_field" message="You must enter a value, for the default value enter 70" />
						</param>
						<param name="jctdistance" type="integer" value="200" label="Distance tolerance for junction compatibility (default 200)">
							<validator type="empty_field" message="You must enter a value, for the default value enter 200" />
						</param>
						<param name="jctlength" type="integer" value="500" label="Length threshold for compatible junctions (default 500)">
							<validator type="empty_field" message="You must enter a value, for the default value enter 500" />
						</param>
				
						<!--form field to select junction confidence in tumors-->
						<param name="jctpriority" type="select" label="Use normal junction priority for vcf output?">
							<option value="" selected="true">no</option>
							<option value="--jctpriority">yes</option>
						</param>
				 
						<!--form field to select junction confidence in tumors-->
						<param name="jcttumor" type="select" label="Use high confidence junctions for tumors?">
							<option value="" selected="true">no</option>
							<option value="--jcttumor">yes</option>
						</param>
		
						<!--form field to select field names to include in vcf-->
						<param name="fields" type="select" label="Field names to be included in vcf file" multiple="true" help="Select all field names (default) or a collection of individual field names.">
							<option value="all" selected="true">-- all (default) --</option>
							<option value="NS">NS - Number of samples</option>
							<option value="AN">AN - Total number of alleles in called genotypes</option>
							<option value="AC">AC - Allele count in genotypes</option>
							<option value="CGA_XR">CGA_XR - External database reference</option>
							<option value="CGA_FI">CGA_FI - Functional impact</option>
							<option value="CGA_PFAM">CGA_PFAM - PFAM domain </option>
							<option value="CGA_MIRB">CGA_MIRB - miRBaseId</option>
							<option value="CGA_SDO">CGA_SDO - Depth of overlapping segmental duplications</option>
							<option value="CGA_RPT">CGA_RPT - Overlapping repeatMasker annotations</option>
							<option value="GT">GT - Genotype</option>
							<option value="PS">PS - Phase set</option>
							<option value="FT">FT - Sample genotype filters</option>
							<option value="GL">GL - Genotype likelihoods</option>
							<option value="CGA_CEHQ">CGA_CEHQ - Calibrated haplotype quality based on EAF assumption</option>
							<option value="CGA_CEGL">CGA_CEGL - Genotype likelihoods based on CEHQ</option>
							<option value="SS">SS - Somatic status</option>
							<option value="HQ">HQ - Haplotype quality</option>
							<option value="EHQ">EHQ - Haplotype quality based on EAF assumption</option>
							<option value="GQ">GQ - Genotype quality</option>
							<option value="DP">DP - Total read depth</option>
							<option value="AD">AD - Allelic depths</option>
							<option value="CGA_RDP">CGA_RDP - Read depth in reference</option>
							<option value="CGA_ODP">CGA_ODP - Other total read depth: somatic comparison</option>
							<option value="CGA_OAD">CGA_OAD - Other allelic depths: somatic comparison</option>
							<option value="CGA_ORDP">CGA_ORDP - Other reference depth: somatic comparison </option>
							<option value="CGA_SOMC">CGA_SOMC - Somatic Category</option>
							<option value="CGA_SOMR">CGA_SOMR - Somatic Rank</option>
							<option value="CGA_SOMS">CGA_SOMS - Somatic Score</option>
							<option value="CGA_GP">CGA_GP - Normalized mean GC corrected coverage</option>
							<option value="CGA_NP">CGA_NP - Normalized mean coverage for 2k window</option>
							<option value="CGA_CP">CGA_CP - Diploid-model ploidy call for segment</option>
							<option value="CGA_PS">CGA_PS - Diploid-model called ploidy score</option>
							<option value="CGA_CT">CGA_CT - Diploid-model CNV type</option>
							<option value="CGA_TS">CGA_TS - Diploid-model CNV type score</option>
							<option value="CGA_CL">CGA_CL - Nondiploid-model called level</option>
							<option value="CGA_LS">CGA_LS - Nondiploid-model called level score</option>
							<option value="CGA_SCL">CGA_SCL - Nondiploid-model somatic called level</option>
							<option value="CGA_SLS">CGA_SLS - Non-diploid-model somatic called level score</option>
							<option value="CGA_LAF">CGA_LAF - Lesser Allele Fraction estimate, 100k window</option>
							<option value="CGA_LLAF">CGA_LLAF - Lesser Allele Fraction lower bound, 100k window</option>
							<option value="CGA_ULAF">CGA_ULAF - Lesser Allele Fraction upper bound, 100k window</option>
							<option value="SVTYPE">SVTYPE - Type of structural variation</option>
							<option value="CGA_BF">CGA_BF - Frequency in set of baseline genomes</option>
							<option value="CGA_MEDEL">CGA_MEDEL - Mobile element deletion</option>
							<option value="MATEID">MATEID - ID of mate breakend</option>
							<option value="CGA_BNDG">CGA_BNDG - Transcript name and strand of genes containing breakend</option>
							<option value="CGA_BNDGO">CGA_BNDGO - Transcript name and strand of genes containing mate breakend</option>
							<option value="CGA_BNDP">CGA_BNDP - Precision of breakend</option>
							<option value="CGA_BNDMPC">CGA_BNDMPC - Mate pair count supporting a breakend</option>
							<option value="CGA_BNDPOS">CGA_BNDPOS - Position of breakend as detected in individual genome</option>
							<option value="CGA_BNDDEF">CGA_BNDDEF - Breakend definition in individual genome</option>
						</param>
 					</when>
					
					<when value="masterVar">
						<!--conditional to select inputs-->
						<conditional name="data_sources">
							<param name="data_source" type="select" label="Where are the input files?">
								<option value="in" selected="true">imported into Galaxy</option>
								<option value="out">located outside Galaxy (data on server or mounted drive)</option>
							</param>
							
							<when value="in">
								<!--form field to select input files-->
								<repeat name="files" title="MasterVar file" min="1" max="2">
									<param name="input" type="data" format="cg_mastervar" label="Dataset">
										<validator type="dataset_ok_validator"/>
										<validator type="dataset_metadata_in_file" filename="cg_crr_files.loc"
										 metadata_name="dbkey" metadata_column="1"
										 message="cgatools is not currently available for this build."/>
									</param>
								</repeat>
							</when>
							
							<when value="out">
								<!--form field to enter input file-->
								<param name="input" type="text" label="File with list of genome root directories or masterVar files" size="200" help="Enter file name with full path (/path/file). This file should contain a list of genome root directory names, one per line in the format /path/dir (e.g. /harddrive/GS00000XXXX-DID/GS00000YYYY-ASM/GS00123-DNA_G01), or a list of masterVar files, one per line in the format /path/masterVarfile (e.g. /harddrive/GS00000XXXX-DID/GS00000YYYY-ASM/GS00123-DNA_G01/ASM/masterVarBeta-GS00000YYYY-ASM.tsv.bz2).">
									<validator type="empty_field" message="You must supply the list of genome root directories or masterVar files"/>
								</param>
							</when>
						</conditional>
									
						<!--form field to select no-calls-->
						<param name="nocalls" type="select" label="Include no-calls?">
							<option value="" selected="true">no</option>
							<option value="--nocalls">yes</option>
						</param>

						<!--form field to enter calibration directory-->
						<param name="calibration" type="text" size="300" label="Directory calibration data (/path/calibration-root)" help="The directory containing calibration data. For example, there should exist a file calibration-root/0.0.0/metrics.tsv. Calibration data can be downloaded from ftp://ftp.completegenomics.com/ScoreCalibrationFiles/var-calibration-v2.tgz"/>
						
						<!--form field to select field names to include in vcf-->
						<param name="fields" type="select" label="Field names to be included in vcf file" multiple="true" help="Select all field names (default) or a collection of individual field names.">
							<option value="all" selected="true">-- all (default) --</option>
							<option value="NS">NS - Number of samples</option>
							<option value="AN">AN - Total number of alleles in called genotypes</option>
							<option value="AC">AC - Allele count in genotypes</option>
							<option value="CGA_XR">CGA_XR - External database reference</option>
							<option value="CGA_FI">CGA_FI - Functional impact</option>
							<option value="CGA_PFAM">CGA_PFAM - PFAM domain </option>
							<option value="CGA_MIRB">CGA_MIRB - miRBaseId</option>
							<option value="CGA_SDO">CGA_SDO - Depth of overlapping segmental duplications</option>
							<option value="CGA_RPT">CGA_RPT - Overlapping repeatMasker annotations</option>
							<option value="GT">GT - Genotype</option>
							<option value="PS">PS - Phase set</option>
							<option value="FT">FT - Sample genotype filters</option>
							<option value="GL">GL - Genotype likelihoods</option>
							<option value="CGA_CEHQ">CGA_CEHQ - Calibrated haplotype quality based on EAF assumption</option>
							<option value="CGA_CEGL">CGA_CEGL - Genotype likelihoods based on CEHQ</option>
							<option value="SS">SS - Somatic status</option>
							<option value="HQ">HQ - Haplotype quality</option>
							<option value="EHQ">EHQ - Haplotype quality based on EAF assumption</option>
							<option value="GQ">GQ - Genotype quality</option>
							<option value="DP">DP - Total read depth</option>
							<option value="AD">AD - Allelic depths</option>
							<option value="CGA_RDP">CGA_RDP - Read depth in reference</option>
							<option value="CGA_ODP">CGA_ODP - Other total read depth: somatic comparison</option>
							<option value="CGA_OAD">CGA_OAD - Other allelic depths: somatic comparison</option>
							<option value="CGA_ORDP">CGA_ORDP - Other reference depth: somatic comparison </option>
							<option value="CGA_SOMC">CGA_SOMC - Somatic Category</option>
							<option value="CGA_SOMR">CGA_SOMR - Somatic Rank</option>
							<option value="CGA_SOMS">CGA_SOMS - Somatic Score</option>
						</param>
					</when>
					
					<when value="CNV">
						<!--conditional to select inputs-->
						<conditional name="data_sources">
							<param name="data_source" type="select" label="Where are the input files?">
								<option value="out" selected="true">located outside Galaxy (data on server or mounted drive)</option>
							</param>
							
							<when value="out">
								<!--form field to enter input file-->
								<param name="input" type="text" label="File with list of genome root directories" size="200" help="Enter file name with full path (/path/file). This file should contain a list of genome root directory names, one per line in the format /path/dir (e.g. /harddrive/GS00000XXXX-DID/GS00000YYYY-ASM/GS00123-DNA_G01).">
									<validator type="empty_field" message="You must supply the list of genome root directories"/>
								</param>
							</when>
						</conditional>
						
						<!--form field to select field names to include in vcf-->
						<param name="fields" type="select" label="Field names to be included in vcf file" multiple="true" help="Select all field names (default) or a collection of individual field names.">
							<option value="all" selected="true">-- all (default) --</option>
							<option value="GT">GT - Genotype</option>
							<option value="CGA_GP">CGA_GP - Normalized mean GC corrected coverage</option>
							<option value="CGA_NP">CGA_NP - Normalized mean coverage for 2k window</option>
							<option value="CGA_CP">CGA_CP - Diploid-model ploidy call for segment</option>
							<option value="CGA_PS">CGA_PS - Diploid-model called ploidy score</option>
							<option value="CGA_CT">CGA_CT - Diploid-model CNV type</option>
							<option value="CGA_TS">CGA_TS - Diploid-model CNV type score</option>
							<option value="CGA_CL">CGA_CL - Nondiploid-model called level</option>
							<option value="CGA_LS">CGA_LS - Nondiploid-model called level score</option>
							<option value="CGA_SCL">CGA_SCL - Nondiploid-model somatic called level</option>
							<option value="CGA_SLS">CGA_SLS - Non-diploid-model somatic called level score</option>
							<option value="CGA_LAF">CGA_LAF - Lesser Allele Fraction estimate, 100k window</option>
							<option value="CGA_LLAF">CGA_LLAF - Lesser Allele Fraction lower bound, 100k window</option>
							<option value="CGA_ULAF">CGA_ULAF - Lesser Allele Fraction upper bound, 100k window</option>
						</param>
					</when>
					
					<when value="SV">
						<!--conditional to select inputs-->
						<conditional name="data_sources">
							<param name="data_source" type="select" label="Where are the input files?">
								<option value="in" selected="true">imported into Galaxy</option>
								<option value="out">located outside Galaxy (data on server or mounted drive)</option>
							</param>
							
							<when value="in">
								<!--form field to select mastervar files-->
								<repeat name="files" title="SV files" min="1" max="2">
									<param name="input" type="data" format="tabular" label="Dataset">
										<validator type="dataset_ok_validator" />
										<validator type="dataset_metadata_in_file" filename="cg_crr_files.loc"
										 metadata_name="dbkey" metadata_column="1"
										 message="cgatools is not currently available for this build."/>
									</param>
								</repeat>
							</when>
							
							<when value="out">
								<!--form field to enter input file-->
								<param name="input" type="text" label="File with list of genome root directories or SV files" size="200" help="Enter file name with full path (/path/file). This file should contain a list of genome root directory names, one per line in the format /path/dir (e.g. /harddrive/GS00000XXXX-DID/GS00000YYYY-ASM/GS00123-DNA_G01), or a list of SV files, one per line in the format /path/SVfile (e.g. /harddrive/GS00000XXXX-DID/GS00000YYYY-ASM/GS00123-DNA_G01/ASM/SV/allJunctionsBeta-GS00000YYYY-ASM.tsv).">
									<validator type="empty_field" message="You must supply the list of genome root directories or SV files"/>
								</param>
							</when>
						</conditional>
									
						<!--form fields junction threshold options-->
						<param name="jctscore" type="integer" value="10" label="Junction score thresholds (discordant mate pair count) (default 10)">
							<validator type="empty_field" message="You must enter a value, for the default value enter 10" />
						</param>
						<param name="jctside" type="integer" value="70" label="Junction side length threshold (default 70)">
							<validator type="empty_field" message="You must enter a value, for the default value enter 70" />
						</param>
						<param name="jctdistance" type="integer" value="200" label="Distance tolerance for junction compatibility (default 200)">
							<validator type="empty_field" message="You must enter a value, for the default value enter 200" />
						</param>
						<param name="jctlength" type="integer" value="500" label="Length threshold for compatible junctions (default 500)">
							<validator type="empty_field" message="You must enter a value, for the default value enter 500" />
						</param>
				
						<!--form field to select junction confidence in tumors-->
						<param name="jctpriority" type="select" label="Use normal junction priority for vcf output?">
							<option value="" selected="true">no</option>
							<option value="--jctpriority">yes</option>
						</param>
				 
						<!--form field to select junction confidence in tumors-->
						<param name="jcttumor" type="select" label="Use high confidence junctions for tumors?">
							<option value="" selected="true">no</option>
							<option value="--jcttumor">yes</option>
						</param>
						
						<!--form field to select field names to include in vcf-->
						<param name="fields" type="select" label="Field names to be included in vcf file" multiple="true" help="Select all field names (default) or a collection of individual field names.">
							<option value="all" selected="true">-- all (default) --</option>
				      <option value="GT">GT - Genotype</option>
				      <option value="FT">FT - Sample genotype filters</option>
							<option value="SVTYPE">SVTYPE - Type of structural variation</option>
							<option value="CGA_BF">CGA_BF - Frequency in set of baseline genomes</option>
							<option value="CGA_MEDEL">CGA_MEDEL - Mobile element deletion</option>
							<option value="MATEID">MATEID - ID of mate breakend</option>
							<option value="CGA_BNDG">CGA_BNDG - Transcript name and strand of genes containing breakend</option>
							<option value="CGA_BNDGO">CGA_BNDGO - Transcript name and strand of genes containing mate breakend</option>
							<option value="CGA_BNDP">CGA_BNDP - Precision of breakend</option>
							<option value="CGA_BNDMPC">CGA_BNDMPC - Mate pair count supporting a breakend</option>
							<option value="CGA_BNDPOS">CGA_BNDPOS - Position of breakend as detected in individual genome</option>
							<option value="CGA_BNDDEF">CGA_BNDDEF - Breakend definition in individual genome</option>
						</param>
					</when>
				</conditional>
			</when>

			<when value="3">
				<!--form field to select input sources-->
				<conditional name="sources">
					<param name="source" type="select" label="Data sources to be included for each genome">
						<option value="masterVar,CNV" selected="true">masterVar + CNV</option>
						<option value="masterVar">masterVar</option>
						<option value="CNV">CNV</option>
					</param>
					
					<when value="masterVar,CNV">
						<!--conditional to select inputs-->
						<conditional name="data_sources">
							<param name="data_source" type="select" label="Where are the input files?">
								<option value="out" selected="true">located outside Galaxy (data on server or mounted drive)</option>
							</param>
							
							<when value="out">
								<!--form field to select outside list of genome directories or mastervar files-->
								<param name="input" type="text" label="File with list of genome root directories" size="200" help="Enter file name with full path (/path/file). This file should contain a list of genome root directory names, one per line in the format /path/dir (e.g. /harddrive/GS00000XXXX-DID/GS00000YYYY-ASM/GS00123-DNA_G01).">
									<validator type="empty_field" message="You must supply the list of genome root directories"/>
								</param>
							</when>
						</conditional>
					
						<!--form field to select no-calls-->
						<param name="nocalls" type="select" label="Include no-calls?">
							<option value="" selected="true">no</option>
							<option value="--nocalls">yes</option>
						</param>
						
						<!--form field to enter calibration directory-->
						<param name="calibration" type="text" size="300" label="Directory calibration data (/path/calibration-root)" help="The directory containing calibration data. For example, there should exist a file calibration-root/0.0.0/metrics.tsv. Calibration data can be downloaded from ftp://ftp.completegenomics.com/ScoreCalibrationFiles/var-calibration-v2.tgz"/>

						<!--form field to select field names to include in vcf-->
						<param name="fields" type="select" label="Field names to be included in vcf file" multiple="true" help="Select all field names (default) or a collection of individual field names.">
							<option value="all" selected="true">-- all (default) --</option>
							<option value="NS">NS - Number of samples</option>
							<option value="AN">AN - Total number of alleles in called genotypes</option>
							<option value="AC">AC - Allele count in genotypes</option>
							<option value="CGA_XR">CGA_XR - External database reference</option>
							<option value="CGA_FI">CGA_FI - Functional impact</option>
							<option value="CGA_PFAM">CGA_PFAM - PFAM domain </option>
							<option value="CGA_MIRB">CGA_MIRB - miRBaseId</option>
							<option value="CGA_SDO">CGA_SDO - Depth of overlapping segmental duplications</option>
							<option value="CGA_RPT">CGA_RPT - Overlapping repeatMasker annotations</option>
							<option value="GT">GT - Genotype</option>
							<option value="PS">PS - Phase set</option>
							<option value="FT">FT - Sample genotype filters</option>
							<option value="GL">GL - Genotype likelihoods</option>
							<option value="CGA_CEHQ">CGA_CEHQ - Calibrated haplotype quality based on EAF assumption</option>
							<option value="CGA_CEGL">CGA_CEGL - Genotype likelihoods based on CEHQ</option>
							<option value="SS">SS - Somatic status</option>
							<option value="HQ">HQ - Haplotype quality</option>
							<option value="EHQ">EHQ - Haplotype quality based on EAF assumption</option>
							<option value="GQ">GQ - Genotype quality</option>
							<option value="DP">DP - Total read depth</option>
							<option value="AD">AD - Allelic depths</option>
							<option value="CGA_RDP">CGA_RDP - Read depth in reference</option>
							<option value="CGA_ODP">CGA_ODP - Other total read depth: somatic comparison</option>
							<option value="CGA_OAD">CGA_OAD - Other allelic depths: somatic comparison</option>
							<option value="CGA_ORDP">CGA_ORDP - Other reference depth: somatic comparison </option>
							<option value="CGA_SOMC">CGA_SOMC - Somatic Category</option>
							<option value="CGA_SOMR">CGA_SOMR - Somatic Rank</option>
							<option value="CGA_SOMS">CGA_SOMS - Somatic Score</option>
							<option value="CGA_GP">CGA_GP - Normalized mean GC corrected coverage</option>
							<option value="CGA_NP">CGA_NP - Normalized mean coverage for 2k window</option>
							<option value="CGA_CP">CGA_CP - Diploid-model ploidy call for segment</option>
							<option value="CGA_PS">CGA_PS - Diploid-model called ploidy score</option>
							<option value="CGA_CT">CGA_CT - Diploid-model CNV type</option>
							<option value="CGA_TS">CGA_TS - Diploid-model CNV type score</option>
							<option value="CGA_CL">CGA_CL - Nondiploid-model called level</option>
							<option value="CGA_LS">CGA_LS - Nondiploid-model called level score</option>
							<option value="CGA_SCL">CGA_SCL - Nondiploid-model somatic called level</option>
							<option value="CGA_SLS">CGA_SLS - Non-diploid-model somatic called level score</option>
							<option value="CGA_LAF">CGA_LAF - Lesser Allele Fraction estimate, 100k window</option>
							<option value="CGA_LLAF">CGA_LLAF - Lesser Allele Fraction lower bound, 100k window</option>
							<option value="CGA_ULAF">CGA_ULAF - Lesser Allele Fraction upper bound, 100k window</option>
						</param>
					</when>
					
					<when value="masterVar">
						<!--conditional to select inputs-->
						<conditional name="data_sources">
							<param name="data_source" type="select" label="Where are the input files?">
								<option value="in" selected="true">imported into Galaxy</option>
								<option value="out">located outside Galaxy (data on server or mounted drive)</option>
							</param>
							
							<when value="in">
								<!--form field to select mastervar files-->
								<repeat name="files" title="MasterVar files" min="1">
									<param name="input" type="data" format="cg_mastervar" label="Dataset">
										<validator type="dataset_ok_validator" />
										<validator type="dataset_metadata_in_file" filename="cg_crr_files.loc"
										 metadata_name="dbkey" metadata_column="1"
										 message="cgatools is not currently available for this build."/>
									</param>
								</repeat>
							</when>
							
							<when value="out">
								<!--form field to enter input file-->
								<param name="input" type="text" label="File with list of genome root directories or masterVar files" size="200" help="Enter file name with full path (/path/file). This file should contain a list of genome root directory names, one per line in the format /path/dir (e.g. /harddrive/GS00000XXXX-DID/GS00000YYYY-ASM/GS00123-DNA_G01), or a list of masterVar files, one per line in the format /path/masterVarfile (e.g. /harddrive/GS00000XXXX-DID/GS00000YYYY-ASM/GS00123-DNA_G01/ASM/masterVarBeta-GS00000YYYY-ASM.tsv.bz2).">
									<validator type="empty_field" message="You must supply the list of genome root directories or masterVar files"/>
								</param>
							</when>
						</conditional>
									
						<!--form field to select no-calls-->
						<param name="nocalls" type="select" label="Include no-calls?">
							<option value="" selected="true">no</option>
							<option value="--nocalls">yes</option>
						</param>
						
						<!--form field to enter calibration directory-->
						<param name="calibration" type="text" size="300" label="Directory calibration data (/path/calibration-root)" help="The directory containing calibration data. For example, there should exist a file calibration-root/0.0.0/metrics.tsv. Calibration data can be downloaded from ftp://ftp.completegenomics.com/ScoreCalibrationFiles/var-calibration-v2.tgz"/>

						<!--form field to select field names to include in vcf-->
						<param name="fields" type="select" label="Field names to be included in vcf file" multiple="true" help="Select all field names (default) or a collection of individual field names.">
							<option value="all" selected="true">-- all (default) --</option>
							<option value="NS">NS - Number of samples</option>
							<option value="AN">AN - Total number of alleles in called genotypes</option>
							<option value="AC">AC - Allele count in genotypes</option>
							<option value="CGA_XR">CGA_XR - External database reference</option>
							<option value="CGA_FI">CGA_FI - Functional impact</option>
							<option value="CGA_PFAM">CGA_PFAM - PFAM domain </option>
							<option value="CGA_MIRB">CGA_MIRB - miRBaseId</option>
							<option value="CGA_SDO">CGA_SDO - Depth of overlapping segmental duplications</option>
							<option value="CGA_RPT">CGA_RPT - Overlapping repeatMasker annotations</option>
							<option value="GT">GT - Genotype</option>
							<option value="PS">PS - Phase set</option>
							<option value="FT">FT - Sample genotype filters</option>
							<option value="GL">GL - Genotype likelihoods</option>
							<option value="CGA_CEHQ">CGA_CEHQ - Calibrated haplotype quality based on EAF assumption</option>
							<option value="CGA_CEGL">CGA_CEGL - Genotype likelihoods based on CEHQ</option>
							<option value="SS">SS - Somatic status</option>
							<option value="HQ">HQ - Haplotype quality</option>
							<option value="EHQ">EHQ - Haplotype quality based on EAF assumption</option>
							<option value="GQ">GQ - Genotype quality</option>
							<option value="DP">DP - Total read depth</option>
							<option value="AD">AD - Allelic depths</option>
							<option value="CGA_RDP">CGA_RDP - Read depth in reference</option>
							<option value="CGA_ODP">CGA_ODP - Other total read depth: somatic comparison</option>
							<option value="CGA_OAD">CGA_OAD - Other allelic depths: somatic comparison</option>
							<option value="CGA_ORDP">CGA_ORDP - Other reference depth: somatic comparison </option>
							<option value="CGA_SOMC">CGA_SOMC - Somatic Category</option>
							<option value="CGA_SOMR">CGA_SOMR - Somatic Rank</option>
							<option value="CGA_SOMS">CGA_SOMS - Somatic Score</option>
						</param>
					</when>
					
					<when value="CNV">
						<!--conditional to select inputs-->
						<conditional name="data_sources">
							<param name="data_source" type="select" label="Where are the input files?">
								<option value="out" selected="true">located outside Galaxy (data on server or mounted drive)</option>
							</param>
							
							<when value="out">
								<!--form field to enter input file-->
								<param name="input" type="text" label="File with list of genome root directories" size="200" help="Enter file name with full path (/path/file). This file should contain a list of genome root directory names, one per line in the format /path/dir (e.g. /harddrive/GS00000XXXX-DID/GS00000YYYY-ASM/GS00123-DNA_G01).">
									<validator type="empty_field" message="You must supply the list of genome root directories"/>
								</param>
							</when>
						</conditional>
						
						<!--form field to select field names to include in vcf-->
						<param name="fields" type="select" label="Field names to be included in vcf file" multiple="true" help="Select all field names (default) or a collection of individual field names.">
							<option value="all" selected="true">-- all (default) --</option>
							<option value="GT">GT - Genotype</option>
							<option value="CGA_GP">CGA_GP - Normalized mean GC corrected coverage</option>
							<option value="CGA_NP">CGA_NP - Normalized mean coverage for 2k window</option>
							<option value="CGA_CP">CGA_CP - Diploid-model ploidy call for segment</option>
							<option value="CGA_PS">CGA_PS - Diploid-model called ploidy score</option>
							<option value="CGA_CT">CGA_CT - Diploid-model CNV type</option>
							<option value="CGA_TS">CGA_TS - Diploid-model CNV type score</option>
							<option value="CGA_CL">CGA_CL - Nondiploid-model called level</option>
							<option value="CGA_LS">CGA_LS - Nondiploid-model called level score</option>
							<option value="CGA_SCL">CGA_SCL - Nondiploid-model somatic called level</option>
							<option value="CGA_SLS">CGA_SLS - Non-diploid-model somatic called level score</option>
							<option value="CGA_LAF">CGA_LAF - Lesser Allele Fraction estimate, 100k window</option>
							<option value="CGA_LLAF">CGA_LLAF - Lesser Allele Fraction lower bound, 100k window</option>
							<option value="CGA_ULAF">CGA_ULAF - Lesser Allele Fraction upper bound, 100k window</option>
						</param>
					</when>
				</conditional>
			</when>
		</conditional>
  </inputs>

  <help>
  
**What it does**

This tool uses cgatools mkvcf to convert Complete Genomics masterVar files, including CNV, SV and/or MEI data, to vcf format version.

**cgatools 1.6.0 Documentation**

Userguide: http://cgatools.sourceforge.net/docs/1.6.0/cgatools-user-guide.pdf

Release notes: http://cgatools.sourceforge.net/docs/1.6.0/cgatools-release-notes.pdf

**Command line reference**::

		COMMAND NAME
				mkvcf - Converts var file(s) or masterVar file(s) to VCF.
		
		DESCRIPTION
				Converts var file(s) or masterVar file(s) to VCF.
		
		OPTIONS
			-h [ --help ] 
						Print this help message.
		
			--beta 
						This is a beta command. To run this command, you must pass the --beta 
						flag.
		
			--reference arg
						The reference crr file.
		
			--output arg (=STDOUT)
						The output file (may be omitted for stdout).
		
			--field-names arg (=GT,PS,NS,AN,AC,SS,FT,CGA_XR,CGA_FI,GQ,HQ,EHQ,CGA_CEHQ,GL,
							CGA_CEGL,DP,AD,CGA_RDP,CGA_ODP,CGA_OAD,CGA_ORDP,CGA_PFAM,CGA_MIRB,CGA_RPT,
							CGA_SDO,CGA_SOMC,CGA_SOMR,CGA_SOMS,CGA_GP,CGA_NP,CGA_CP,CGA_PS,CGA_CT,
							CGA_TS,CGA_CL,CGA_LS,CGA_SCL,CGA_SLS,CGA_LAF,CGA_LLAF,CGA_ULAF,CGA_IS,
							CGA_IDC,CGA_IDCL,CGA_IDCR,CGA_RDC,CGA_NBET,CGA_ETS,CGA_KES,CGA_BF,
							CGA_MEDEL,MATEID,SVTYPE,CGA_BNDG,CGA_BNDGO,CGA_BNDMPC,CGA_BNDPOS,CGA_BNDDEF,
							CGA_BNDP)
						Comma-separated list of field names. By default, all fields are 
						included, but you may override this option to ensure only a subset of 
						the fields is included in the VCF output. For a description of each 
						field, see the cgatools user guide.
		
			--source-names arg (=masterVar,CNV,SV,MEI)
						Comma-separated list of source names. The following source names are 
						available:
							masterVar - Includes records extracted from the masterVar file.
							CNV       - Includes CNV-related records.
							SV        - Includes records derived from junctions files.
							MEI       - Includes records describing mobile element insertions.
						Some of these source types are only available for more recent pipeline 
						versions, and some of these source types do not support multi-genome 
						VCFs. For more information about which source types are available for 
						which versions of the Complete Genomics pipeline software, see the 
						cgatools user guide.
		
			--genome-root arg
						For each genome to include in the VCF, the genome root directory, for 
						example /data/GS00118-DNA_A01; this directory is expected to contain 
						the ASM and LIB subdirectories, for example. You must supply this 
						option for each genome in the VCF, unless you are using 
						--source-names=masterVar and you have specified the --master-var option
						for each genome in the VCF.
		
			--master-var arg
						For each genome to include in the VCF, the masterVar file. If 
						genome-roots parameter is given, this parameter defaults to the 
						masterVar in the given genome-root.
		
			--include-no-calls 
						Small variants VCF records include loci that have no 
						reference-inconsistent calls.
						
			--calibration-root arg
						The directory containing calibration data. For example, there should 
						exist a file calibration-root/version0.0.0/metrics.tsv. This option is only 
						required if CGA_CEHQ or CGA_CEGL are included in the --field-names 
						parameter.
		
			--junction-file arg
						For each genome to include in the VCF, the junctions file. If 
						genome-roots parameter is given, this parameter defaults to the 
						respective junctions file in the export directory.
		
			--junction-score-threshold arg (=10)
						Junction score thresholds (discordant mate pair count).
		
			--junction-side-length-threshold arg (=70)
						Junction side length threshold.
		
			--junction-distance-tolerance arg (=200)
						Distance tolerance for junction compatibility.
		
			--junction-length-threshold arg (=500)
						Length threshold for compatible junctions.
		
			--junction-normal-priority 
						Normal junction priority for vcf output.
		
			--junction-tumor-hc 
						use high confidence junctions for tumors.
		
		
		SUPPORTED FORMAT_VERSION
				0.3 or later
  </help>
</tool>