annotate cgatools/tools/cgatools_1.5/calldiff.xml @ 0:8ff0e55a0fc9 draft default tip

Uploaded
author completegenomics
date Fri, 22 Jun 2012 15:53:08 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
1 <tool id="cg_calldiff" name="calldiff(beta) 1.5" version="1.0.0">
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
2 <!--
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
3 This tool creates a GUI for the calldiff function of cgatools from Complete Genomics, Inc.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
4 written 6-18-2012 by bcrain@completegenomics.com
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
5 -->
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
6
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
7 <description>compares two Complete Genomics variant files.</description> <!--adds description in toolbar-->
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
8
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
9 <requirements>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
10 <requirement type="binary">cgatools</requirement>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
11 </requirements>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
12
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
13 <command> <!--run executable-->
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
14 cgatools | head -1;
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
15 cgatools calldiff --beta
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
16 --reference ${crr.fields.path}
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
17 --variantsA $data_sources.inputA
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
18 --variantsB $data_sources.inputB
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
19 $validation
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
20 $diploid
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
21 --locus-stats-column-count $column
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
22 --max-hypothesis-count $hypothesis
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
23 --output-prefix cg_
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
24 --reports `echo ${report1} ${report2} ${report3} ${report4} ${report5} ${somatic.report6} | sed 's/ */,/g'`
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
25 #if $somatic.report6 == "SomaticOutput"
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
26 --genome-rootA $somatic.genomeA
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
27 --genome-rootB $somatic.genomeB
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
28 --calibration-root $somatic.calibration
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
29 #end if
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
30 </command>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
31
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
32 <outputs>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
33 <data format="tabular" name="output1" from_work_dir="cg_SuperlocusOutput.tsv" label="${tool.name} on ${on_string}: SuperlocusOutput">
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
34 <filter>(report1 == 'SuperlocusOutput')</filter>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
35 </data>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
36 <data format="tabular" name="output2" from_work_dir="cg_SuperlocusStats.tsv" label="${tool.name} on ${on_string}: SuperlocusStats">
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
37 <filter>(report2 == 'SuperlocusStats')</filter>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
38 </data>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
39 <data format="tabular" name="output3" from_work_dir="cg_LocusOutput.tsv" label="${tool.name} on ${on_string}: LocusOutput">
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
40 <filter>(report3 == 'LocusOutput')</filter>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
41 </data>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
42 <data format="tabular" name="output4" from_work_dir="cg_LocusStats.tsv" label="${tool.name} on ${on_string}: LocusStats">
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
43 <filter>(report4 == 'LocusStats')</filter>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
44 </data>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
45 <data format="tabular" name="output5a" from_work_dir="cg_VariantsA.tsv" label="${tool.name} on ${on_string}: VariantsA">
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
46 <filter>(report5 == 'VariantOutput')</filter>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
47 </data>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
48 <data format="tabular" name="output5b" from_work_dir="cg_VariantsB.tsv" label="${tool.name} on ${on_string}: VariantsB">
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
49 <filter>(report5 == 'VariantOutput')</filter>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
50 </data>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
51 <data format="tabular" name="output6" from_work_dir="cg_SomaticOutput.tsv" label="${tool.name} on ${on_string}: SomaticOutput">
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
52 <filter>(somatic['report6'] == 'SomaticOutput')</filter>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
53 </data>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
54 </outputs>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
55
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
56 <inputs>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
57 <!--form field to select crr file-->
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
58 <param name="crr" type="select" label="Reference genome (.crr file)">
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
59 <options from_data_table="cg_crr_files" />
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
60 </param>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
61
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
62 <!--conditional to select variant file input-->
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
63 <conditional name="data_sources">
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
64 <param name="data_source" type="select" label="Where are the input varfiles?">
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
65 <option value="in" selected="true">imported into Galaxy</option>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
66 <option value="out">located outside Galaxy (available only for local Galaxy instances)</option>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
67 </param>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
68 <when value="in">
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
69 <!--form field to select variant files-->
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
70 <param name="inputA" type="data" format="cg_var" label="Var file A">
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
71 <validator type="unspecified_build" />
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
72 <validator type="dataset_metadata_in_file" filename="cg_crr_files.loc"
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
73 metadata_name="dbkey" metadata_column="1"
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
74 message="cgatools is not currently available for this build."/>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
75 </param>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
76 <param name="inputB" type="data" format="cg_var" label="Var file B">
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
77 <validator type="unspecified_build" />
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
78 <validator type="dataset_metadata_in_file" filename="cg_crr_files.loc"
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
79 metadata_name="dbkey" metadata_column="1"
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
80 message="cgatools is not currently available for this build."/>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
81 </param>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
82 </when>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
83 <when value="out">
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
84 <!--form field to select crr file-->
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
85 <param name="inputA" type="text" label="Variant file A (/path/varfile)" size="300" help="Variant file can be compressed (gz, bz2), e.g. /harddrive/GS00000XXXX-DID/GS00000YYYY-ASM/GS00123-DNA_G01_2000/ASM/var-GS00000YYYY-ASM.tsv.bz2"/>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
86 <param name="inputB" type="text" label="Variant file B (/path/varfile)" size="300" help="Variant file can be compressed (gz, bz2), e.g. /harddrive/GS00000XXXX-DID/GS00000YYYY-ASM/GS00123-DNA_G01_2000/ASM/var-GS00000YYYY-ASM.tsv.bz2."/>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
87 </when>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
88 </conditional>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
89
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
90 <param name="diploid" type="select" label="Use diploid variant model" help="Uses varScoreEAF instead of varScoreVAF in somatic score computations. Also, uses diploid variant model instead of variable allele mixture model.">
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
91 <option value="">no</option>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
92 <option value="--diploid">yes</option>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
93 </param>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
94
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
95 <param name="column" type="integer" label="Number of columns for locus compare classification in the locus stats file (default 15)" value="15"/>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
96
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
97 <param name="hypothesis" type="integer" label="Maximum number of possible phasings to consider for a superlocus (default 32)" value="32"/>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
98
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
99 <param name="validation" type="select" label="Reference cover validation" help="Turns on/off validation that all bases of a chromosome are covered by calls of the variant file.">
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
100 <option value="">on</option>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
101 <option value="--no-reference-cover-validation">off</option>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
102 </param>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
103
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
104 <param name="report1" type="select" label="Create report SuperlocusOutput">
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
105 <option value="">no</option>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
106 <option value="SuperlocusOutput">yes</option>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
107 </param>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
108 <param name="report2" type="select" label="Create report SuperlocusStats">
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
109 <option value="">no</option>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
110 <option value="SuperlocusStats">yes</option>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
111 </param>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
112 <param name="report3" type="select" label="Create report LocusOutput">
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
113 <option value="">no</option>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
114 <option value="LocusOutput">yes</option>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
115 </param>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
116 <param name="report4" type="select" label="Create report LocusStats">
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
117 <option value="">no</option>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
118 <option value="LocusStats">yes</option>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
119 </param>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
120 <param name="report5" type="select" label="Create report VariantOutput" help="Both variant files annotated by comparison results.If the somatic output report is requested, file A is also annotated with the same score ranks as produced in that report.">
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
121 <option value="">no</option>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
122 <option value="VariantOutput">yes</option>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
123 </param>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
124
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
125 <conditional name="somatic">
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
126 <param name="report6" type="select" label="Create report SomaticOutput" help="This report can only be generated on local Galaxy instances. Report for the list of simple variations that are present only in file 'A', annotated with the score that indicates the probability of the variation being truly somatic. Note: generating this report slows calldiff by 10x-20x.">
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
127 <option value="">no</option>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
128 <option value="SomaticOutput">yes</option>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
129 </param>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
130 <when value="SomaticOutput">
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
131 <param name="genomeA" type="text" size="300" label="Directory for genome A (/path/dir)" help="The 'A' genome directory, e.g. /harddrive/GS00000XXXX-DID/GS00000YYYY-ASM/GS00123-DNA_G01_2000; this directory is expected to contain ASM/REF and ASM/EVIDENCE subdirectories."/>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
132 <param name="genomeB" type="text" size="300" label="Directory for genome B (/path/dir)" help="The 'B' genome directory, e.g. /harddrive/GS00000XXXX-DID/GS00000YYYY-ASM/GS00123-DNA_G01_2000; this directory is expected to contain ASM/REF and ASM/EVIDENCE subdirectories."/>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
133 <param name="calibration" type="text" size="300" label="Directory calibration data (/path/dir)" help="The directory containing calibration data. For example, there should exist a file calibration-root/0.0.0/metrics.tsv. Calibration data can be downloaded from ftp://ftp.completegenomics.com/ScoreCalibrationFiles/var-calibration-v1.tgz"/>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
134 </when>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
135 </conditional>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
136
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
137 </inputs>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
138
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
139 <help>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
140
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
141 **What it does**
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
142
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
143 This tool compares two Complete Genomics variant files.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
144
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
145 **cgatools 1.5.0 Documentation**
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
146
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
147 Userguide: http://cgatools.sourceforge.net/docs/1.5.0/cgatools-user-guide.pdf
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
148
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
149 Release notes: http://cgatools.sourceforge.net/docs/1.5.0/cgatools-release-notes.pdf
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
150
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
151 **Command line reference**::
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
152
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
153 COMMAND NAME
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
154 calldiff - Compares two Complete Genomics variant files.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
155
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
156 DESCRIPTION
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
157 Compares two Complete Genomics variant files. Divides the genome up into
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
158 superloci of nearby variants, then compares the superloci. Also refines the
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
159 comparison to determine per-call or per-locus comparison results.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
160
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
161 Comparison results are usually described by a semi-colon separated string,
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
162 one per allele. Each allele's comparison result is one of the following
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
163 classifications:
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
164
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
165 ref-identical The alleles of the two variant files are identical, and
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
166 they are consistent with the reference.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
167 alt-identical The alleles of the two variant files are identical, and
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
168 they are inconsistent with the reference.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
169 ref-consistent The alleles of the two variant files are consistent,
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
170 and they are consistent with the reference.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
171 alt-consistent The alleles of the two variant files are consistent,
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
172 and they are inconsistent with the reference.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
173 onlyA The alleles of the two variant files are inconsistent,
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
174 and only file A is inconsistent with the reference.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
175 onlyB The alleles of the two variant files are inconsistent,
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
176 and only file B is inconsistent with the reference.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
177 mismatch The alleles of the two variant files are inconsistent,
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
178 and they are both inconsistent with the reference.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
179 phase-mismatch The two variant files would be consistent if the
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
180 hapLink field had been empty, but they are
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
181 inconsistent.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
182 ploidy-mismatch The superlocus did not have uniform ploidy.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
183
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
184 In some contexts, this classification is rolled up into a simplified
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
185 classification, which is one of "identical", "consistent", "onlyA",
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
186 "onlyB", or "mismatch".
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
187
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
188 A good place to start looking at the results is the superlocus-output file.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
189 It has columns defined as follows:
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
190
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
191 SuperlocusId An identifier given to the superlocus.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
192 Chromosome The name of the chromosome.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
193 Begin The 0-based offset of the start of the superlocus.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
194 End The 0-based offset of the base one past the end of the
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
195 superlocus.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
196 Classification The match classification of the superlocus.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
197 Reference The reference sequence.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
198 AllelesA A semicolon-separated list of the alleles (one per
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
199 haplotype) for variant file A, for the phasing with the
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
200 best comparison result.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
201 AllelesB A semicolon-separated list of the alleles (one per
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
202 haplotype) for variant file B, for the phasing with the
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
203 best comparison result.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
204
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
205 The locus-output file contains, for each locus in file A and file B that is
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
206 not consistent with the reference, an annotated set of calls for the locus.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
207 The calls are annotated with the following columns:
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
208
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
209 SuperlocusId The id of the superlocus containing the locus.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
210 File The variant file (A or B).
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
211 LocusClassification The locus classification is determined by the
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
212 varType column of the call that is inconsistent
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
213 with the reference, concatenated with a
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
214 modifier that describes whether the locus is
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
215 heterozygous, homozygous, or contains no-calls.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
216 If there is no one variant in the locus (i.e.,
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
217 it is heterozygous alt-alt), the locus
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
218 classification begins with "other".
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
219 LocusDiffClassification The match classification for the locus. This is
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
220 defined to be the best of the comparison of the
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
221 locus to the same region in the other file, or
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
222 the comparison of the superlocus.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
223
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
224 The somatic output file contains a list of putative somatic variations of
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
225 genome A. The output includes only those loci that can be classified as
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
226 snp, del, ins or sub in file A, and are called reference in the file B.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
227 Every locus is annotated with the following columns:
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
228
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
229 VarCvgA The totalReadCount from file A for this locus
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
230 (computed on the fly if file A is not a
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
231 masterVar file).
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
232 VarScoreA The varScoreVAF from file A, or varScoreEAF if
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
233 the "--diploid" option is used.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
234 RefCvgB The maximum of the uniqueSequenceCoverage
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
235 values for the locus in genome B.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
236 RefScoreB Minimum of the reference scores of the locus in
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
237 genome B.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
238 SomaticCategory The category used for determining the
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
239 calibrated scores and the SomaticRank.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
240 VarScoreACalib The calibrated variant score of file A, under
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
241 the model selected by using or not using the
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
242 "--diploid" option, and corrected for the count
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
243 of heterozygous variants observed in this
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
244 genome. See user guide for more information.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
245 VarScoreBCalib The calibrated reference score of file B, under
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
246 the model selected by using or not using the
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
247 "--diploid" option, and corrected for the count
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
248 of heterozygous variants observed in this
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
249 genome. See user guide for more information.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
250 SomaticRank The estimated rank of this somatic mutation,
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
251 amongst all true somatic mutations within this
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
252 SomaticCategory. The value is a number between
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
253 0 and 1; a value of 0.012 means, for example,
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
254 that an estimated 1.2% of the true somatic
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
255 mutations in this somaticCategory have a
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
256 somaticScore less than the somaticScore for
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
257 this mutation. See user guide for more
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
258 information.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
259 SomaticScore An integer that provides a total order on
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
260 quality for all somatic mutations. It is equal
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
261 to -10*log10( P(false)/P(true) ), under the
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
262 assumption that this genome has a rate of
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
263 somatic mutation equal to 1/Mb for
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
264 SomaticCategory snp, 1/10Mb for SomaticCategory
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
265 ins, 1/10Mb for SomaticCategory del, and 1/20Mb
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
266 for SomaticCategory sub. The computation is
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
267 based on the assumptions described in the user
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
268 guide, and is affected by choice of variant
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
269 model selected by using or not using the
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
270 "--diploid" option.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
271 SomaticQuality Equal to VQHIGH for all somatic mutations where
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
272 SomaticScore &gt;= -10. Otherwise, this column is
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
273 empty.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
274
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
275 OPTIONS
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
276 -h [ --help ]
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
277 Print this help message.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
278
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
279 --reference arg
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
280 The input crr file.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
281
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
282 --variantsA arg
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
283 The "A" input variant file.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
284
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
285 --variantsB arg
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
286 The "B" input variant file.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
287
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
288 --output-prefix arg
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
289 The path prefix for all output reports.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
290
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
291 --reports arg (=SuperlocusOutput,SuperlocusStats,LocusOutput,LocusStats)
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
292 Comma-separated list of reports to generate. (Beware any reports whose
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
293 name begins with "Debug".) A report is one of:
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
294 SuperlocusOutput Report for superlocus classification.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
295 SuperlocusStats Report for superlocus classification stats.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
296 LocusOutput Report for locus classification.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
297 LocusStats Report for locus stats.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
298 VariantOutput Both variant files annotated by comparison
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
299 results.If the somatic output report is
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
300 requested, file A is also annotated with the
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
301 same score ranks as produced in that report.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
302 SomaticOutput Report for the list of simple variations that
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
303 are present only in file "A", annotated with
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
304 the score that indicates the probability of
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
305 the variation being truly somatic. Requires
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
306 beta, genome-rootA, and genome-rootB options
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
307 to be provided as well. Note: generating this
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
308 report slows calldiff by 10x-20x.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
309 DebugCallOutput Report for call classification.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
310 DebugSuperlocusOutput Report for debug superlocus information.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
311 DebugSomaticOutput Report for distribution estimates used for
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
312 somatic rescoring. Only produced if
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
313 SomaticOutput is also turned on.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
314
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
315 --diploid
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
316 Uses varScoreEAF instead of varScoreVAF in somatic score computations.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
317 Also, uses diploid variant model instead of variable allele mixture
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
318 model.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
319
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
320 --locus-stats-column-count arg (=15)
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
321 The number of columns for locus compare classification in the locus
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
322 stats file.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
323
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
324 --max-hypothesis-count arg (=32)
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
325 The maximum number of possible phasings to consider for a superlocus.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
326
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
327 --no-reference-cover-validation
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
328 Turns off validation that all bases of a chromosome are covered by
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
329 calls of the variant file.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
330
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
331 --genome-rootA arg
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
332 The "A" genome directory, for example /data/GS00118-DNA_A01; this
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
333 directory is expected to contain ASM/REF and ASM/EVIDENCE
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
334 subdirectories.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
335
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
336 --genome-rootB arg
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
337 The "B" genome directory.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
338
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
339 --calibration-root arg
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
340 The directory containing calibration data. For example, there should
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
341 exist a file calibration-root/0.0.0/metrics.tsv.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
342
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
343 --beta
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
344 This flag enables the SomaticOutput report, which is beta
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
345 functionality.
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
346
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
347 SUPPORTED FORMAT_VERSION
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
348 0.3 or later
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
349 </help>
8ff0e55a0fc9 Uploaded
completegenomics
parents:
diff changeset
350 </tool>