annotate testing_cgatools-982e19c29ec0/cgatools/tools/cgatools_1.6/calldiff.xml @ 0:ef23f9cd599b draft default tip

Uploaded
author devteam
date Thu, 27 Sep 2012 13:37:59 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
1 <tool id="cg_calldiff" name="calldiff(beta) 1.6" version="1.0.1">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
2 <!--
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
3 This tool creates a GUI for the calldiff function of cgatools from Complete Genomics, Inc.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
4 written 6-18-2012 by bcrain@completegenomics.com
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
5 updated 8-14-2012 by bcrain@completegenomics.com
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
6 -->
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
7
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
8 <description>compares two Complete Genomics variant files.</description>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
9
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
10 <command>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
11 <!-- print version of cgatools to STDOUT-->
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
12 cgatools | head -1;
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
13
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
14 <!-- print command lines to STDOUT-->
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
15 echo "cgatools calldiff --beta
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
16 --reference ${crr.fields.path}
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
17 --variantsA $data_sources.inputA
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
18 --variantsB $data_sources.inputB
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
19 $validation
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
20 $diploid
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
21 --locus-stats-column-count $column
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
22 --max-hypothesis-count $hypothesis
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
23 --output-prefix cg_
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
24 --reports `echo ${report1} ${report2} ${report3} ${report4} ${report5} ${somatic.report6} | sed 's/ */,/g'`
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
25 #if $somatic.report6 == "SomaticOutput"
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
26 --genome-rootA $somatic.genomeA
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
27 --genome-rootB $somatic.genomeB
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
28 --calibration-root $somatic.calibration
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
29 #end if
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
30 ";
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
31
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
32 <!-- execute cgatools-->
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
33 cgatools calldiff --beta
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
34 --reference ${crr.fields.path}
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
35 --variantsA $data_sources.inputA
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
36 --variantsB $data_sources.inputB
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
37 $validation
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
38 $diploid
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
39 --locus-stats-column-count $column
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
40 --max-hypothesis-count $hypothesis
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
41 --output-prefix cg_
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
42 --reports `echo ${report1} ${report2} ${report3} ${report4} ${report5} ${somatic.report6} | sed 's/ */,/g'`
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
43 #if $somatic.report6 == "SomaticOutput"
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
44 --genome-rootA $somatic.genomeA
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
45 --genome-rootB $somatic.genomeB
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
46 --calibration-root $somatic.calibration
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
47 #end if
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
48 </command>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
49
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
50 <outputs>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
51 <data format="tabular" name="output1" from_work_dir="cg_SuperlocusOutput.tsv" label="${tool.name} SuperlocusOutput">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
52 <filter>(report1 == 'SuperlocusOutput')</filter>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
53 </data>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
54 <data format="tabular" name="output2" from_work_dir="cg_SuperlocusStats.tsv" label="${tool.name} SuperlocusStats">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
55 <filter>(report2 == 'SuperlocusStats')</filter>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
56 </data>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
57 <data format="tabular" name="output3" from_work_dir="cg_LocusOutput.tsv" label="${tool.name} LocusOutput">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
58 <filter>(report3 == 'LocusOutput')</filter>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
59 </data>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
60 <data format="tabular" name="output4" from_work_dir="cg_LocusStats.tsv" label="${tool.name} LocusStats">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
61 <filter>(report4 == 'LocusStats')</filter>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
62 </data>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
63 <data format="tabular" name="output5a" from_work_dir="cg_VariantsA.tsv" label="${tool.name} VariantsA">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
64 <filter>(report5 == 'VariantOutput')</filter>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
65 </data>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
66 <data format="tabular" name="output5b" from_work_dir="cg_VariantsB.tsv" label="${tool.name} VariantsB">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
67 <filter>(report5 == 'VariantOutput')</filter>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
68 </data>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
69 <data format="tabular" name="output6" from_work_dir="cg_SomaticOutput.tsv" label="${tool.name} SomaticOutput">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
70 <filter>(somatic['report6'] == 'SomaticOutput')</filter>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
71 </data>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
72 </outputs>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
73
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
74 <inputs>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
75 <!--form field to select crr file-->
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
76 <param name="crr" type="select" label="Reference genome (.crr file)">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
77 <options from_data_table="cg_crr_files" />
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
78 </param>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
79
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
80 <!--conditional to select variant file input-->
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
81 <conditional name="data_sources">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
82 <param name="data_source" type="select" label="Where are the input varfiles?">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
83 <option value="in" selected="true">imported into Galaxy</option>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
84 <option value="out">located outside Galaxy (data on server or mounted drive)</option>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
85 </param>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
86
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
87 <!--form field to select variant files-->
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
88 <when value="in">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
89 <param name="inputA" type="data" format="cg_var" label="Var file A">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
90 <validator type="dataset_ok_validator" />
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
91 <validator type="dataset_metadata_in_file" filename="cg_crr_files.loc"
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
92 metadata_name="dbkey" metadata_column="1"
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
93 message="cgatools is not currently available for this build."/>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
94 </param>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
95 <param name="inputB" type="data" format="cg_var" label="Var file B">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
96 <validator type="dataset_ok_validator" />
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
97 <validator type="dataset_metadata_in_file" filename="cg_crr_files.loc"
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
98 metadata_name="dbkey" metadata_column="1"
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
99 message="cgatools is not currently available for this build."/>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
100 </param>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
101 </when>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
102
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
103 <!--form field to enter input files-->
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
104 <when value="out">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
105 <param name="inputA" type="text" label="Variant file A (/path/varfile)" size="300" help="Variant file can be compressed (gz, bz2), e.g. /harddrive/GS00000XXXX-DID/GS00000YYYY-ASM/GS00123-DNA_G01_2000/ASM/var-GS00000YYYY-ASM.tsv.bz2">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
106 <validator type="empty_field" message="You must supply a var file"/>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
107 </param>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
108 <param name="inputB" type="text" label="Variant file B (/path/varfile)" size="300" help="Variant file can be compressed (gz, bz2), e.g. /harddrive/GS00000XXXX-DID/GS00000YYYY-ASM/GS00123-DNA_G01_2000/ASM/var-GS00000YYYY-ASM.tsv.bz2.">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
109 <validator type="empty_field" message="You must supply a var file"/>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
110 </param>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
111 </when>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
112 </conditional>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
113
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
114 <!--other parameters-->
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
115 <param name="diploid" type="select" label="Use diploid variant model" help="Uses varScoreEAF instead of varScoreVAF in somatic score computations. Also, uses diploid variant model instead of variable allele mixture model.">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
116 <option value="">no</option>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
117 <option value="--diploid">yes</option>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
118 </param>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
119
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
120 <param name="column" type="integer" label="Number of columns for locus compare classification in the locus stats file (default 15)" value="15">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
121 <validator type="empty_field" message="You must enter a value, the default is 15" />
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
122 </param>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
123
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
124 <param name="hypothesis" type="integer" label="Maximum number of possible phasings to consider for a superlocus (default 32)" value="32">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
125 <validator type="empty_field" message="You must enter a value, the default is 32" />
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
126 </param>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
127
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
128 <param name="validation" type="select" label="Reference cover validation (default on)" help="Turns on/off validation that all bases of a chromosome are covered by calls of the variant file.">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
129 <option value="">on</option>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
130 <option value="--no-reference-cover-validation">off</option>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
131 </param>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
132
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
133 <!--form fields to select ooutput reports-->
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
134 <param name="report1" type="select" label="Create report SuperlocusOutput">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
135 <option value="">no</option>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
136 <option value="SuperlocusOutput">yes</option>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
137 </param>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
138 <param name="report2" type="select" label="Create report SuperlocusStats">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
139 <option value="">no</option>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
140 <option value="SuperlocusStats">yes</option>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
141 </param>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
142 <param name="report3" type="select" label="Create report LocusOutput">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
143 <option value="">no</option>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
144 <option value="LocusOutput">yes</option>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
145 </param>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
146 <param name="report4" type="select" label="Create report LocusStats">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
147 <option value="">no</option>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
148 <option value="LocusStats">yes</option>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
149 </param>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
150 <param name="report5" type="select" label="Create report VariantOutput" help="Both variant files annotated by comparison results. If the somatic output report is requested, file A is also annotated with the same score ranks as produced in that report.">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
151 <option value="">no</option>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
152 <option value="VariantOutput">yes</option>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
153 </param>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
154
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
155 <!--conditional to select somatic reports and related inputs-->
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
156 <conditional name="somatic">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
157 <param name="report6" type="select" label="Create report SomaticOutput" help="This report can only be generated on local Galaxy instances. Report for the list of simple variations that are present only in file 'A', annotated with the score that indicates the probability of the variation being truly somatic. Note: generating this report slows calldiff by 10x-20x.">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
158 <option value="">no</option>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
159 <option value="SomaticOutput">yes</option>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
160 </param>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
161
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
162 <when value="SomaticOutput">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
163 <param name="genomeA" type="text" size="300" label="Directory for genome A (/path/dir)" help="The 'A' genome directory, e.g. /harddrive/GS00000XXXX-DID/GS00000YYYY-ASM/GS00123-DNA_G01_2000; this directory is expected to contain ASM/REF and ASM/EVIDENCE subdirectories.">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
164 <validator type="empty_field" message="You must supply the genome root directory for this sample"/>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
165 </param>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
166 <param name="genomeB" type="text" size="300" label="Directory for genome B (/path/dir)" help="The 'B' genome directory, e.g. /harddrive/GS00000XXXX-DID/GS00000YYYY-ASM/GS00123-DNA_G01_2000; this directory is expected to contain ASM/REF and ASM/EVIDENCE subdirectories.">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
167 <validator type="empty_field" message="You must supply the genome root directory for this sample"/>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
168 </param>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
169 <param name="calibration" type="text" size="300" label="Directory containing calibration data (/path/dir)" help="The directory containing calibration data. For example, there should exist a file calibration-root/0.0.0/metrics.tsv. Calibration data can be downloaded from ftp://ftp.completegenomics.com/ScoreCalibrationFiles/var-calibration-v1.tgz">
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
170 <validator type="empty_field" message="You must supply the directory containing the calibration data"/>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
171 </param>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
172 </when>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
173 </conditional>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
174
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
175 </inputs>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
176
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
177 <help>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
178
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
179 **What it does**
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
180
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
181 This tool uses cgatools calldiff to compare two Complete Genomics variant files.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
182
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
183 **cgatools 1.6.0 Documentation**
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
184
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
185 Userguide: http://cgatools.sourceforge.net/docs/1.6.0/cgatools-user-guide.pdf
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
186
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
187 Release notes: http://cgatools.sourceforge.net/docs/1.6.0/cgatools-release-notes.pdf
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
188
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
189 **Command line reference**::
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
190
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
191 COMMAND NAME
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
192 calldiff - Compares two Complete Genomics variant files.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
193
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
194 DESCRIPTION
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
195 Compares two Complete Genomics variant files. Divides the genome up into
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
196 superloci of nearby variants, then compares the superloci. Also refines the
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
197 comparison to determine per-call or per-locus comparison results.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
198
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
199 Comparison results are usually described by a semi-colon separated string,
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
200 one per allele. Each allele's comparison result is one of the following
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
201 classifications:
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
202
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
203 ref-identical The alleles of the two variant files are identical, and
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
204 they are consistent with the reference.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
205 alt-identical The alleles of the two variant files are identical, and
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
206 they are inconsistent with the reference.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
207 ref-consistent The alleles of the two variant files are consistent,
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
208 and they are consistent with the reference.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
209 alt-consistent The alleles of the two variant files are consistent,
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
210 and they are inconsistent with the reference.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
211 onlyA The alleles of the two variant files are inconsistent,
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
212 and only file A is inconsistent with the reference.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
213 onlyB The alleles of the two variant files are inconsistent,
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
214 and only file B is inconsistent with the reference.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
215 mismatch The alleles of the two variant files are inconsistent,
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
216 and they are both inconsistent with the reference.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
217 phase-mismatch The two variant files would be consistent if the
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
218 hapLink field had been empty, but they are
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
219 inconsistent.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
220 ploidy-mismatch The superlocus did not have uniform ploidy.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
221
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
222 In some contexts, this classification is rolled up into a simplified
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
223 classification, which is one of "identical", "consistent", "onlyA",
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
224 "onlyB", or "mismatch".
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
225
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
226 A good place to start looking at the results is the superlocus-output file.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
227 It has columns defined as follows:
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
228
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
229 SuperlocusId An identifier given to the superlocus.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
230 Chromosome The name of the chromosome.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
231 Begin The 0-based offset of the start of the superlocus.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
232 End The 0-based offset of the base one past the end of the
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
233 superlocus.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
234 Classification The match classification of the superlocus.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
235 Reference The reference sequence.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
236 AllelesA A semicolon-separated list of the alleles (one per
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
237 haplotype) for variant file A, for the phasing with the
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
238 best comparison result.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
239 AllelesB A semicolon-separated list of the alleles (one per
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
240 haplotype) for variant file B, for the phasing with the
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
241 best comparison result.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
242
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
243 The locus-output file contains, for each locus in file A and file B that is
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
244 not consistent with the reference, an annotated set of calls for the locus.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
245 The calls are annotated with the following columns:
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
246
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
247 SuperlocusId The id of the superlocus containing the locus.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
248 File The variant file (A or B).
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
249 LocusClassification The locus classification is determined by the
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
250 varType column of the call that is inconsistent
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
251 with the reference, concatenated with a
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
252 modifier that describes whether the locus is
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
253 heterozygous, homozygous, or contains no-calls.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
254 If there is no one variant in the locus (i.e.,
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
255 it is heterozygous alt-alt), the locus
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
256 classification begins with "other".
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
257 LocusDiffClassification The match classification for the locus. This is
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
258 defined to be the best of the comparison of the
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
259 locus to the same region in the other file, or
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
260 the comparison of the superlocus.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
261
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
262 The somatic output file contains a list of putative somatic variations of
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
263 genome A. The output includes only those loci that can be classified as
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
264 snp, del, ins or sub in file A, and are called reference in the file B.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
265 Every locus is annotated with the following columns:
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
266
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
267 VarCvgA The totalReadCount from file A for this locus
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
268 (computed on the fly if file A is not a
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
269 masterVar file).
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
270 VarScoreA The varScoreVAF from file A, or varScoreEAF if
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
271 the "--diploid" option is used.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
272 RefCvgB The maximum of the uniqueSequenceCoverage
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
273 values for the locus in genome B.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
274 RefScoreB Minimum of the reference scores of the locus in
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
275 genome B.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
276 SomaticCategory The category used for determining the
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
277 calibrated scores and the SomaticRank.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
278 VarScoreACalib The calibrated variant score of file A, under
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
279 the model selected by using or not using the
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
280 "--diploid" option, and corrected for the count
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
281 of heterozygous variants observed in this
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
282 genome. See user guide for more information.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
283 VarScoreBCalib The calibrated reference score of file B, under
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
284 the model selected by using or not using the
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
285 "--diploid" option, and corrected for the count
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
286 of heterozygous variants observed in this
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
287 genome. See user guide for more information.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
288 SomaticRank The estimated rank of this somatic mutation,
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
289 amongst all true somatic mutations within this
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
290 SomaticCategory. The value is a number between
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
291 0 and 1; a value of 0.012 means, for example,
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
292 that an estimated 1.2% of the true somatic
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
293 mutations in this somaticCategory have a
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
294 somaticScore less than the somaticScore for
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
295 this mutation. See user guide for more
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
296 information.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
297 SomaticScore An integer that provides a total order on
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
298 quality for all somatic mutations. It is equal
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
299 to -10*log10( P(false)/P(true) ), under the
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
300 assumption that this genome has a rate of
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
301 somatic mutation equal to 1/Mb for
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
302 SomaticCategory snp, 1/10Mb for SomaticCategory
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
303 ins, 1/10Mb for SomaticCategory del, and 1/20Mb
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
304 for SomaticCategory sub. The computation is
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
305 based on the assumptions described in the user
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
306 guide, and is affected by choice of variant
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
307 model selected by using or not using the
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
308 "--diploid" option.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
309 SomaticQuality Equal to VQHIGH for all somatic mutations where
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
310 SomaticScore &gt;= -10. Otherwise, this column is
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
311 empty.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
312
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
313 OPTIONS
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
314 -h [ --help ]
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
315 Print this help message.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
316
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
317 --reference arg
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
318 The input crr file.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
319
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
320 --variantsA arg
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
321 The "A" input variant file.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
322
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
323 --variantsB arg
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
324 The "B" input variant file.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
325
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
326 --output-prefix arg
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
327 The path prefix for all output reports.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
328
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
329 --reports arg (=SuperlocusOutput,SuperlocusStats,LocusOutput,LocusStats)
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
330 Comma-separated list of reports to generate. (Beware any reports whose
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
331 name begins with "Debug".) A report is one of:
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
332 SuperlocusOutput Report for superlocus classification.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
333 SuperlocusStats Report for superlocus classification stats.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
334 LocusOutput Report for locus classification.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
335 LocusStats Report for locus stats.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
336 VariantOutput Both variant files annotated by comparison
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
337 results.If the somatic output report is
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
338 requested, file A is also annotated with the
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
339 same score ranks as produced in that report.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
340 SomaticOutput Report for the list of simple variations that
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
341 are present only in file "A", annotated with
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
342 the score that indicates the probability of
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
343 the variation being truly somatic. Requires
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
344 beta, genome-rootA, and genome-rootB options
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
345 to be provided as well. Note: generating this
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
346 report slows calldiff by 10x-20x.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
347 DebugCallOutput Report for call classification.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
348 DebugSuperlocusOutput Report for debug superlocus information.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
349 DebugSomaticOutput Report for distribution estimates used for
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
350 somatic rescoring. Only produced if
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
351 SomaticOutput is also turned on.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
352
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
353 --diploid
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
354 Uses varScoreEAF instead of varScoreVAF in somatic score computations.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
355 Also, uses diploid variant model instead of variable allele mixture
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
356 model.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
357
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
358 --locus-stats-column-count arg (=15)
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
359 The number of columns for locus compare classification in the locus
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
360 stats file.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
361
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
362 --max-hypothesis-count arg (=32)
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
363 The maximum number of possible phasings to consider for a superlocus.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
364
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
365 --no-reference-cover-validation
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
366 Turns off validation that all bases of a chromosome are covered by
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
367 calls of the variant file.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
368
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
369 --genome-rootA arg
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
370 The "A" genome directory, for example /data/GS00118-DNA_A01; this
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
371 directory is expected to contain ASM/REF and ASM/EVIDENCE
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
372 subdirectories.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
373
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
374 --genome-rootB arg
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
375 The "B" genome directory.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
376
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
377 --calibration-root arg
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
378 The directory containing calibration data. For example, there should
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
379 exist a file calibration-root/0.0.0/metrics.tsv.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
380
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
381 --beta
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
382 This flag enables the SomaticOutput report, which is beta
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
383 functionality.
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
384
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
385 SUPPORTED FORMAT_VERSION
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
386 0.3 or later
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
387 </help>
ef23f9cd599b Uploaded
devteam
parents:
diff changeset
388 </tool>