annotate variant_combine.xml @ 0:1a6e16391727 draft default tip

Imported from capsule None
author devteam
date Tue, 01 Apr 2014 10:50:25 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
1 <tool id="gatk_variant_combine" name="Combine Variants" version="0.0.4">
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
2 <description></description>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
3 <requirements>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
4 <requirement type="package" version="1.4">gatk</requirement>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
5 </requirements>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
6 <macros>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
7 <import>gatk_macros.xml</import>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
8 </macros>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
9 <command interpreter="python">gatk_wrapper.py
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
10 --max_jvm_heap_fraction "1"
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
11 --stdout "${output_log}"
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
12
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
13 #set $priority_order = []
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
14 #for $input_variant in $reference_source.input_variants:
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
15 -d "--variant:${input_variant.input_variant_name},%(file_type)s" "${input_variant.input_variant}" "${input_variant.input_variant.ext}" "input_variant_${input_variant.input_variant_name}"
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
16 #set $input_variant_name = str( $input_variant.input_variant_name )
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
17 #assert $input_variant_name not in $priority_order, "Variant Names must be unique" ##this should be handled by a validator
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
18 #silent $priority_order.append( $input_variant_name )
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
19 #end for
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
20 -p 'java
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
21 -jar "\$JAVA_JAR_PATH/GenomeAnalysisTK.jar"
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
22 -T "CombineVariants"
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
23 --out "${output_variants}"
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
24 ##--num_threads 4 ##hard coded, for now
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
25 -et "NO_ET" ##ET no phone home
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
26 ##-log "${output_log}" ##don't use this to log to file, instead directly capture stdout
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
27 #if $reference_source.reference_source_selector != "history":
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
28 -R "${reference_source.ref_file.fields.path}"
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
29 #end if
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
30 --genotypemergeoption "${genotype_merge_option}"
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
31 --rod_priority_list "${ ','.join( $priority_order ) }"
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
32 '
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
33
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
34 #include source=$standard_gatk_options#
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
35
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
36
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
37 ##start analysis specific options
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
38 #if $analysis_param_type.analysis_param_type_selector == "advanced":
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
39 -p '
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
40 --filteredrecordsmergetype "${analysis_param_type.filtered_records_merge_type}"
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
41 ${analysis_param_type.print_complex_merges}
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
42 ${analysis_param_type.filtered_are_uncalled}
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
43 ${analysis_param_type.minimal_vcf}
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
44 ${analysis_param_type.assume_identical_samples}
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
45
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
46 #if str( $analysis_param_type.set_key ):
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
47 --setKey "${analysis_param_type.set_key}"
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
48 #end if
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
49
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
50 --minimumN "${analysis_param_type.minimum_n}"
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
51 '
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
52 #end if
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
53 </command>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
54 <inputs>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
55
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
56 <conditional name="reference_source">
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
57 <expand macro="reference_source_selector_param" />
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
58 <when value="cached">
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
59 <repeat min="1" name="input_variants" title="Variants to Merge" help="Records will be prioritized in the order that you list them here (-V,--variant &amp;lt;variant&amp;gt;)">
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
60 <param name="input_variant" type="data" format="vcf" label="Input variant file" />
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
61 <param name="input_variant_name" type="text" value="" label="Variant name" help="Names must be unique">
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
62 <validator type="length" min="1" message="You must provide a unique name for this set of variants" />
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
63 </param>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
64 </repeat>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
65 <param name="ref_file" type="select" label="Using reference genome" help="-R,--reference_sequence &amp;lt;reference_sequence&amp;gt;">
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
66 <options from_data_table="gatk_picard_indexes">
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
67 <!-- <filter type="data_meta" key="dbkey" ref="input_variants.input_variant" column="dbkey"/> -->
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
68 </options>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
69 <validator type="no_options" message="A built-in reference genome is not available for the build associated with the selected input file"/>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
70 </param>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
71 </when>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
72 <when value="history"> <!-- FIX ME!!!! -->
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
73 <repeat min="1" name="input_variants" title="Variants to Merge" help="Records will be prioritized in the order that you list them here (-V,--variant &amp;lt;variant&amp;gt;)">
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
74 <param name="input_variant" type="data" format="vcf" label="Input variant file" />
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
75 <param name="input_variant_name" type="text" value="" label="Variant name" help="Names must be unique">
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
76 <validator type="length" min="1" message="You must provide a unique name for this set of variants" />
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
77 </param>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
78 </repeat>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
79 <param name="ref_file" type="data" format="fasta" label="Using reference file" help="-R,--reference_sequence &amp;lt;reference_sequence&amp;gt;" />
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
80 </when>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
81 </conditional>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
82
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
83 <param name="genotype_merge_option" type="select" label="How should we merge genotype records across records for samples shared across the ROD files" help="-genotypeMergeOptions,--genotypemergeoption &amp;lt;genotypemergeoption&amp;gt;" >
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
84 <option value="UNIQUIFY" />
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
85 <option value="PRIORITIZE" selected="true"/>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
86 <option value="UNSORTED" />
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
87 <option value="REQUIRE_UNIQUE" />
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
88 </param>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
89
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
90 <expand macro="gatk_param_type_conditional" />
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
91
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
92
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
93 <expand macro="analysis_type_conditional">
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
94 <param name="filtered_records_merge_type" type="select" label="How should we deal with records seen at the same site in the VCF, but with different FILTER fields?" help="-filteredRecordsMergeType,--filteredrecordsmergetype &amp;lt;filteredrecordsmergetype&amp;gt;" >
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
95 <option value="KEEP_IF_ANY_UNFILTERED" selected="true"/>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
96 <option value="KEEP_IF_ALL_UNFILTERED" />
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
97 </param>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
98
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
99 <param name="print_complex_merges" checked="false" type="boolean" truevalue="--printComplexMerges" falsevalue="" label="Print out interesting sites requiring complex compatibility merging" help="-printComplexMerges,--printComplexMerges" />
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
100 <param name="filtered_are_uncalled" checked="false" type="boolean" truevalue="--filteredAreUncalled" falsevalue="" label="If true, then filtered VCFs are treated as uncalled, so that filtered set annotation don't appear in the combined VCF" help="-filteredAreUncalled,--filteredAreUncalled" />
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
101 <param name="minimal_vcf" checked="false" type="boolean" truevalue="--minimalVCF" falsevalue="" label="If true, then the output VCF will contain no INFO or genotype INFO field" help="-minimalVCF,--minimalVCF" />
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
102
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
103 <param name="set_key" type="text" value="" label="Key, by default set, in the INFO key=value tag emitted describing which set the combined VCF record came from." help="-setKey,--setKey &amp;lt;setKey&amp;gt;"/>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
104 <param name="assume_identical_samples" checked="false" type="boolean" truevalue="--assumeIdenticalSamples" falsevalue="" label="If true, assume input VCFs have identical sample sets and disjoint calls so that one can simply perform a merge sort to combine the VCFs into one, drastically reducing the runtime." help="-assumeIdenticalSamples,--assumeIdenticalSamples" />
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
105 <param name="minimum_n" type="integer" value="1" label="Combine variants and output site only if variant is present in at least N input files." help="-minN,--minimumN &amp;lt;minimumN&amp;gt;"/>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
106
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
107 </expand>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
108
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
109
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
110 </inputs>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
111 <outputs>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
112 <data format="vcf" name="output_variants" label="${tool.name} on ${on_string} (variants)" />
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
113 <data format="txt" name="output_log" label="${tool.name} on ${on_string} (log)" />
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
114 </outputs>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
115 <tests>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
116 <test>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
117 <param name="reference_source_selector" value="history" />
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
118 <param name="ref_file" value="phiX.fasta" ftype="fasta" />
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
119 <param name="input_variant" value="gatk/gatk_variant_annotator/gatk_variant_annotator_out_1.vcf" ftype="vcf" />
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
120 <param name="input_variant_name" value="from_variant_annotator" />
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
121 <param name="genotype_merge_option" value="PRIORITIZE" />
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
122 <param name="gatk_param_type_selector" value="basic" />
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
123 <param name="analysis_param_type_selector" value="basic" />
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
124 <output name="output_variants" file="gatk/gatk_variant_combine/gatk_variant_combine_out_1.vcf" lines_diff="4" />
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
125 <output name="output_log" file="gatk/gatk_variant_combine/gatk_variant_combine_out_1.log.contains" compare="contains" />
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
126 </test>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
127 </tests>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
128 <help>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
129 **What it does**
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
130
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
131 Combines VCF records from different sources; supports both full merges and set unions. Merge: combines multiple records into a single one; if sample names overlap then they are uniquified. Union: assumes each rod represents the same set of samples (although this is not enforced); using the priority list (if provided), emits a single record instance at every position represented in the rods.
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
132
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
133 For more information on using the CombineVariants module, see this `tool specific page &lt;http://www.broadinstitute.org/gsa/wiki/index.php/CombineVariants&gt;`_.
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
134
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
135 To learn about best practices for variant detection using GATK, see this `overview &lt;http://www.broadinstitute.org/gsa/wiki/index.php/Best_Practice_Variant_Detection_with_the_GATK_v3&gt;`_.
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
136
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
137 If you encounter errors, please view the `GATK FAQ &lt;http://www.broadinstitute.org/gsa/wiki/index.php/Frequently_Asked_Questions&gt;`_.
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
138
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
139 ------
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
140
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
141 **Inputs**
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
142
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
143 GenomeAnalysisTK: CombineVariants accepts variant files as input.
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
144
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
145 ------
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
146
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
147 **Outputs**
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
148
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
149 The output is a combined VCF file.
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
150
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
151
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
152 Go `here &lt;http://www.broadinstitute.org/gsa/wiki/index.php/Input_files_for_the_GATK&gt;`_ for details on GATK file formats.
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
153
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
154 -------
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
155
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
156 **Settings**::
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
157
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
158 out File to which variants should be written
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
159 genotypemergeoption How should we merge genotype records for samples shared across the ROD files? (UNIQUIFY|PRIORITIZE|UNSORTED|REQUIRE_UNIQUE)
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
160 filteredrecordsmergetype How should we deal with records seen at the same site in the VCF, but with different FILTER fields? KEEP_IF_ANY_UNFILTERED PASSes the record if any record is unfiltered, KEEP_IF_ALL_UNFILTERED requires all records to be unfiltered (KEEP_IF_ANY_UNFILTERED|KEEP_IF_ALL_UNFILTERED)
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
161 rod_priority_list When taking the union of variants containing genotypes: a comma-separated string describing the priority ordering for the genotypes as far as which record gets emitted; a complete priority list MUST be provided
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
162 printComplexMerges Print out interesting sites requiring complex compatibility merging
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
163 filteredAreUncalled If true, then filtered VCFs are treated as uncalled, so that filtered set annotations don't appear in the combined VCF
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
164 minimalVCF If true, then the output VCF will contain no INFO or genotype INFO field
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
165 setKey Key (by default "set") used in the INFO key=value tag emitted to describe which set the combined VCF record came from. Set to null if you don't want the set field emitted.
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
166 assumeIdenticalSamples If true, assume input VCFs have identical sample sets and disjoint calls so that one can simply perform a merge sort to combine the VCFs into one, drastically reducing the runtime.
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
167 minimumN Combine variants and output site only if variant is present in at least N input files.
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
168
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
169 @CITATION_SECTION@
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
170 </help>
1a6e16391727 Imported from capsule None
devteam
parents:
diff changeset
171 </tool>