annotate haplotype_caller.xml @ 15:01ff8dd37d4d draft default tip

Uploaded
author lz_hust
date Sat, 01 Jun 2019 07:20:41 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
15
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
1 <tool id="gatk2_haplotype_caller" name="Haplotype Caller" version="@VERSION@.2">
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
2 <description>Call SNPs and indels simultaneously via local de-novo assembly of haplotypes in an active region</description>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
3 <macros>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
4 <import>gatk2_macros.xml</import>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
5 </macros>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
6 <expand macro="requirements" />
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
7 <expand macro="version_command" />
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
8 <command interpreter="python">
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
9 gatk2_wrapper.py
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
10 --stdout "${output_log}"
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
11 @BAM_INPUTS@
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
12 -p '
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
13 @JAR_PATH@
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
14 -T "HaplotypeCaller"
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
15 -o "${output_vcf}"
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
16
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
17 \$GATK2_SITE_OPTIONS
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
18
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
19 --num_cpu_threads_per_data_thread \${GALAXY_SLOTS:-4}
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
20
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
21 #if $reference_source.reference_source_selector != "history":
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
22 -R "${reference_source.ref_file.fields.path}"
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
23 #end if
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
24 #if str($input_recal) != 'None':
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
25 --BQSR "${input_recal}"
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
26 #end if
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
27 '
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
28 @DBSNP_OPTIONS@
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
29 $allow_n_cigar_reads
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
30 #include source=$standard_gatk_options#
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
31
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
32 ##start analysis specific options
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
33 #if $analysis_param_type.analysis_param_type_selector == "advanced":
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
34 -p '
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
35 #if $analysis_param_type.heterozygosity.__str__.strip() != '':
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
36 --heterozygosity $analysis_param_type.heterozygosity
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
37 #end if
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
38 --genotyping_mode "${analysis_param_type.genotyping_mode_type.genotyping_mode}"
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
39 #if str( $analysis_param_type.genotyping_mode_type.genotyping_mode ) == 'GENOTYPE_GIVEN_ALLELES':
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
40 --alleles "${analysis_param_type.genotyping_mode_type.input_alleles_rod}"
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
41 #end if
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
42 #if not $analysis_param_type.emitRefConfidence is None:
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
43 --emitRefConfidence $analysis_param_type.emitRefConfidence
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
44 #end if
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
45
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
46 ## files
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
47 #if str($analysis_param_type.activeRegionIn) != 'None':
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
48 --activeRegionIn "$analysis_param_type.activeRegionIn"
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
49 #end if
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
50 #if str($analysis_param_type.comp) != 'None':
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
51 --comp "$analysis_param_type.comp"
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
52 #end if
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
53 ##
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
54 #if str( $analysis_param_type.annotation ) != "None":
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
55 #for $annotation in str( $analysis_param_type.annotation.fields.gatk_value ).split( ','):
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
56 --annotation "${annotation}"
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
57 #end for
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
58 #end if
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
59 #for $additional_annotation in $analysis_param_type.additional_annotations:
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
60 --annotation "${additional_annotation.additional_annotation_name}"
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
61 #end for
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
62 #if str( $analysis_param_type.group ) != "None":
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
63 #for $group in str( $analysis_param_type.group ).split( ','):
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
64 --group "${group}"
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
65 #end for
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
66 #end if
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
67 #if str( $analysis_param_type.exclude_annotations ) != "None":
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
68 #for $annotation in str( $analysis_param_type.exclude_annotations.fields.gatk_value ).split( ','):
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
69 --excludeAnnotation "${annotation}"
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
70 #end for
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
71 #end if
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
72
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
73 ## value settings
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
74 #if $analysis_param_type.contamination_fraction_to_filter.__str__.strip() != '':
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
75 --contamination_fraction_to_filter $analysis_param_type.contamination_fraction_to_filter
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
76 #end if
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
77 #if $analysis_param_type.minPruning.__str__.strip() != '':
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
78 --minPruning $analysis_param_type.minPruning
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
79 #end if
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
80 #if $analysis_param_type.standard_min_confidence_threshold_for_calling.__str__.strip() != '':
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
81 --standard_min_confidence_threshold_for_calling $analysis_param_type.standard_min_confidence_threshold_for_calling
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
82 #end if
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
83 #if $analysis_param_type.standard_min_confidence_threshold_for_emitting.__str__.strip() != '':
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
84 --standard_min_confidence_threshold_for_emitting $analysis_param_type.standard_min_confidence_threshold_for_emitting
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
85 #end if
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
86 #if $analysis_param_type.gcpHMM.__str__.strip() != '':
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
87 --gcpHMM $analysis_param_type.gcpHMM
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
88 #end if
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
89 #if $analysis_param_type.max_alternate_alleles.__str__.strip() != '':
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
90 --max_alternate_alleles $analysis_param_type.max_alternate_alleles
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
91 #end if
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
92 ## mode selections
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
93
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
94 #if $analysis_param_type.pair_hmm_implementation.__str__ != "None" and len($analysis_param_type.pair_hmm_implementation.__str__) > 0:
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
95 --pair_hmm_implementation $analysis_param_type.pair_hmm_implementation
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
96 #end if
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
97 ## optional outputs
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
98 #if $analysis_param_type.activeRegionOut:
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
99 --activeRegionOut $active_region_out
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
100 #end if
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
101 #if $analysis_param_type.graphOutput:
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
102 --graphOutput $graph_out
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
103 #end if
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
104 ## flags
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
105 $analysis_param_type.useAllelesTrigger
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
106 $analysis_param_type.fullHaplotype
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
107 $analysis_param_type.genotypeFullActiveRegion
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
108 $analysis_param_type.debug
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
109 '
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
110 #end if
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
111 </command>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
112 <inputs>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
113 <param name="input_recal" type="data" format="gatk_report" optional="true" label="Covariates table recalibration file" help="The input covariates table file which enables on-the-fly base quality score recalibration. Enables on-the-fly recalibrate of base qualities. The covariates tables are produced by the BaseQualityScoreRecalibrator tool. Please be aware that one should only run recalibration with the covariates file created on the same input bam(s) (-BQSR,--BQSR &amp;lt;recal_file&amp;gt;)" />
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
114 <conditional name="reference_source">
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
115 <expand macro="reference_source_selector_param" />
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
116 <when value="cached">
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
117 <expand macro="input_bams_cached" />
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
118 <param name="ref_file" type="select" label="Using reference genome" help="-R,--reference_sequence &amp;lt;reference_sequence&amp;gt;" >
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
119 <options from_data_table="gatk2_picard_indexes">
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
120 <!-- <filter type="data_meta" key="dbkey" ref="input_bam" column="dbkey"/> does not yet work in a repeat...-->
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
121 </options>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
122 <validator type="no_options" message="A built-in reference genome is not available for the build associated with the selected input file"/>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
123 </param>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
124 </when>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
125 <when value="history">
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
126 <expand macro="input_bams_history" />
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
127 <param name="ref_file" type="data" format="fasta" label="Using reference file" help="-R,--reference_sequence &amp;lt;reference_sequence&amp;gt;" />
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
128 </when>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
129 </conditional>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
130 <expand macro="dbsnp_param" />
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
131
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
132 <expand macro="allow_n_cigar_reads" />
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
133 <expand macro="gatk_param_type_conditional" />
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
134
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
135 <conditional name="analysis_param_type">
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
136 <param name="analysis_param_type_selector" type="select" label="Basic or Advanced Analysis options">
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
137 <option value="basic" selected="True">Basic</option>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
138 <option value="advanced">Advanced</option>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
139 </param>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
140 <when value="basic">
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
141 <!-- Do nothing here -->
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
142 </when>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
143 <when value="advanced">
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
144
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
145 <param name="activeRegionIn" type="data" format="bed,gatk_interval,picard_interval_list,vcf" optional="true" label="activeRegionIn" help="--activeRegionIn / -AR Use this interval list file as the active regions to process"/>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
146 <param name="activeRegionOut" type="boolean" checked="False" truevalue="" falsevalue="" label="activeRegionOut" help="--activeRegionOut / -ARO Output the active region to an interval list file"/>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
147
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
148 <param name="annotation" type="select" multiple="True" display="checkboxes" label="Annotation Types" help="-A,--annotation &amp;lt;annotation&amp;gt;">
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
149 <!-- load the available annotations from an external configuration file, since additional ones can be added to local installs -->
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
150 <options from_data_table="gatk2_annotations">
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
151 <filter type="multiple_splitter" column="tools_valid_for" separator=","/>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
152 <filter type="static_value" value="HaplotypeCaller" column="tools_valid_for"/>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
153 </options>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
154 </param>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
155 <repeat name="additional_annotations" title="Additional annotation" help="-A,--annotation &amp;lt;annotation&amp;gt;">
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
156 <param name="additional_annotation_name" type="text" value="" label="Annotation name" />
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
157 </repeat>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
158 <!--
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
159 <conditional name="snpEff_rod_bind_type">
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
160 <param name="snpEff_rod_bind_type_selector" type="select" label="Provide a snpEff reference-ordered data file">
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
161 <option value="set_snpEff">Set snpEff</option>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
162 <option value="exclude_snpEff" selected="True">Don't set snpEff</option>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
163 </param>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
164 <when value="exclude_snpEff">
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
165 </when>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
166 <when value="set_snpEff">
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
167 <param name="snpEff_input_rod" type="data" format="vcf" label="ROD file" />
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
168 <param name="snpEff_rod_name" type="hidden" value="snpEff" label="ROD Name"/>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
169 </when>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
170 </conditional>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
171 -->
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
172 <param name="group" type="select" multiple="True" display="checkboxes" label="Annotation Interfaces/Groups" help="-G,--group &amp;lt;group&amp;gt;">
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
173 <option value="RodRequiringAnnotation">RodRequiringAnnotation</option>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
174 <option value="Standard">Standard</option>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
175 <option value="Experimental">Experimental</option>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
176 <option value="WorkInProgress">WorkInProgress</option>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
177 <option value="RankSumTest">RankSumTest</option>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
178 <!-- <option value="none">none</option> -->
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
179 </param>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
180 <!-- <param name="family_string" type="text" value="" label="Family String"/> -->
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
181 <param name="exclude_annotations" type="select" multiple="True" display="checkboxes" label="Annotations to exclude" help="-XA,--excludeAnnotation &amp;lt;excludeAnnotation&amp;gt;" >
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
182 <!-- load the available annotations from an external configuration file, since additional ones can be added to local installs -->
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
183 <options from_data_table="gatk2_annotations">
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
184 <filter type="multiple_splitter" column="tools_valid_for" separator=","/>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
185 <filter type="static_value" value="HaplotypeCaller" column="tools_valid_for"/>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
186 </options>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
187 </param>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
188
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
189 <param name="comp" type="data" format="vcf" optional="true" label="comp" help="--comp / -comp comparison VCF file"/>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
190 <param name="contamination_fraction_to_filter" type="float" value="0.05" optional="true" label="contamination_fraction_to_filter" help="--contamination_fraction_to_filter / -contamination Fraction of contamination in sequencing data (for all samples) to aggressively remove">
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
191 <validator type="in_range" message="value between 0.00 and 1.00" min="0" max="1"/>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
192 </param>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
193 <param name="debug" type="boolean" checked="False" truevalue="-debug" falsevalue="" label="debug" help="--debug / -debug If specified, print out very verbose debug information about each triggering active region"/>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
194
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
195 <conditional name="genotyping_mode_type">
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
196 <param name="genotyping_mode" type="select" label="How to determine the alternate allele to use for genotyping" help="-gt_mode,--genotyping_mode &amp;lt;genotyping_mode&amp;gt;">
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
197 <option value="DISCOVERY" selected="True">DISCOVERY</option>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
198 <option value="GENOTYPE_GIVEN_ALLELES">GENOTYPE_GIVEN_ALLELES</option>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
199 </param>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
200 <when value="DISCOVERY">
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
201 <!-- Do nothing here -->
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
202 </when>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
203 <when value="GENOTYPE_GIVEN_ALLELES">
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
204 <param name="input_alleles_rod" type="data" format="vcf" label="Alleles ROD file" help="-alleles,--alleles &amp;lt;alleles&amp;gt;" />
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
205 </when>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
206 </conditional>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
207 <param name="graphOutput" type="boolean" checked="False" truevalue="" falsevalue="" label="graphOutput" help="--graphOutput / -graph File to which debug assembly graph information should be written"/>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
208 <param name="heterozygosity" type="float" value="0.0010" optional="true" label="heterozygosity" help="--heterozygosity / -hets Heterozygosity value used to compute prior likelihoods for any locus"/>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
209 <param name="minPruning" type="integer" value="1" optional="true" label="minPruning" help="--minPruning / -minPruning The minimum allowed pruning factor in assembly graph. Paths with &gt;= X supporting kmers are pruned from the graph">
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
210 <validator type="in_range" message="value between 0 and 127" min="0" max="127"/>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
211 </param>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
212 <!-- http://www.broadinstitute.org/gatk/guide/article?id=2940 -->
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
213 <param name="emitRefConfidence" type="select" optional="true" label="Output confidence estimates" help="Emitting a per-bp or summarized confidence estimate for a site being strictly homozygous-reference (--emitRefConfidence)">
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
214 <option value="NONE" selected="True">don't emit anything</option>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
215 <option value="BP_RESOLUTION">BP_RESOLUTION (emit detailed information for each BP)</option>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
216 <option value="GVCF">GVCF (emit a block summarized version of the BP_RESOLUTION data)</option>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
217 </param>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
218 <param name="pair_hmm_implementation" type="select" optional="true" label="pair_hmm_implementation" help="--pair_hmm_implementation / -pairHMM The PairHMM implementation to use for genotype likelihood calculations">
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
219 <option value="EXACT">EXACT</option>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
220 <option value="ORIGINAL">ORIGINAL</option>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
221 <option value="CACHING">CACHING</option>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
222 <option value="LOGLESS_CACHING" selected="True">LOGLESS_CACHING</option>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
223 </param>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
224 <param name="standard_min_confidence_threshold_for_calling" type="float" value="30.0" optional="true" label="standard_min_confidence_threshold_for_calling" help="--standard_min_confidence_threshold_for_calling / -stand_call_conf The minimum phred-scaled confidence threshold at which variants should be called"/>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
225 <param name="standard_min_confidence_threshold_for_emitting" type="float" value="30.0" optional="true" label="standard_min_confidence_threshold_for_emitting" help="--standard_min_confidence_threshold_for_emitting / -stand_emit_conf The minimum phred-scaled confidence threshold at which variants should be emitted (and filtered with LowQual if less than the calling threshold)"/>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
226 <param name="useAllelesTrigger" type="boolean" checked="False" truevalue="-allelesTrigger" falsevalue="" label="useAllelesTrigger" help="--useAllelesTrigger / -allelesTrigger If specified, use additional trigger on variants found in an external alleles file"/>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
227 <param name="fullHaplotype" type="boolean" checked="False" truevalue="-fullHaplotype" falsevalue="" label="fullHaplotype" help="--fullHaplotype / -fullHaplotype If specified, output the full haplotype sequence instead of converting to individual variants w.r.t. the reference"/>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
228 <param name="gcpHMM" type="integer" value="10" optional="true" label="gcpHMM" help="--gcpHMM / -gcpHMM Flat gap continuation penalty for use in the Pair HMM"/>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
229 <param name="genotypeFullActiveRegion" type="boolean" checked="False" truevalue="-genotypeFullActiveRegion" falsevalue="" label="genotypeFullActiveRegion" help="--genotypeFullActiveRegion / -genotypeFullActiveRegion If specified, alternate alleles are considered to be the full active region for the purposes of genotyping"/>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
230 <param name="max_alternate_alleles" type="integer" value="6" optional="true" label="max_alternate_alleles" help="--max_alternate_alleles / -maxAltAlleles Maximum number of alternate alleles to genotype"/>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
231 </when>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
232 </conditional>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
233 </inputs>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
234 <outputs>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
235 <data format="vcf" name="output_vcf" label="${tool.name} on ${on_string} (VCF)" />
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
236 <data format="vcf" name="graph_out" label="${tool.name} on ${on_string} graph" >
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
237 <filter>analysis_param_type['analysis_param_type_selector'] == "advanced" and analysis_param_type['graphOutput'] == True</filter>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
238 </data>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
239 <data format="vcf" name="active_region_out" label="${tool.name} on ${on_string} activeRegion" >
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
240 <filter>analysis_param_type['analysis_param_type_selector'] == "advanced" and analysis_param_type['activeRegionOut'] == True</filter>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
241 </data>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
242 <data format="txt" name="output_log" label="${tool.name} on ${on_string} (log)" />
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
243 </outputs>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
244 <tests>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
245 <test>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
246 <param name="input_recal" value="gatk/gatk_count_covariates/gatk_count_covariates_out_1.csv" ftype="csv" />
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
247 <param name="reference_source_selector" value="history" />
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
248 <param name="ref_file" value="phiX.fasta" ftype="fasta" />
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
249 <param name="input_bam" value="gatk/gatk_indel_realigner/gatk_indel_realigner_out_1.bam" ftype="bam" />
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
250 <param name="gatk_param_type_selector" value="basic" />
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
251 <param name="analysis_param_type_selector" value="basic" />
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
252 <output name="output_bam" file="gatk/gatk_table_recalibration/gatk_table_recalibration_out_1.bam" ftype="bam" lines_diff="4" />
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
253 <output name="output_log" file="gatk/gatk_table_recalibration/gatk_table_recalibration_out_1.log.contains" compare="contains" />
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
254 </test>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
255 </tests>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
256 <help>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
257 **What it does**
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
258
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
259 **HaplotypeCaller**
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
260 calls SNPs and indels simultaneously via local de-novo assembly of haplotypes in an active region.
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
261 Haplotypes are evaluated using an affine gap penalty Pair HMM.
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
262
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
263 For more information on using the HaplotypeCaller in the GATK, see this `tool specific page &lt;http://www.broadinstitute.org/gatk/gatkdocs/org_broadinstitute_sting_gatk_walkers_haplotypecaller_HaplotypeCaller.html&gt;`_.
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
264
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
265 To learn about best practices for variant detection using GATK, see this `overview &lt;http://www.broadinstitute.org/gatk/guide/topic?name=best-practices&gt;`_.
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
266
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
267 If you encounter errors, please view the `GATK FAQ &lt;http://www.broadinstitute.org/gatk/guide/topic?name=faqs&gt;`_.
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
268
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
269 ------
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
270
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
271 **Inputs**
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
272
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
273 GenomeAnalysisTK: HaplotypeCaller accepts aligned BAM files.
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
274
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
275
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
276 **Outputs**
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
277
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
278 The output is a VCF file with raw, unrecalibrated SNP and indel calls.
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
279
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
280
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
281 Go `here &lt;http://www.broadinstitute.org/gatk/guide/topic?name=intro&gt;`_ for details on GATK file formats.
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
282
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
283 -------
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
284
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
285 **Settings**::
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
286
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
287 activeRegionIn Use this interval list file as the active regions to process
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
288 activeRegionOut Output the active region to this interval list file
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
289 alleles The set of alleles at which to genotype when --genotyping_mode is GENOTYPE_GIVEN_ALLELES
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
290 annotation One or more specific annotations to apply to variant calls
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
291 comp Comparison VCF file
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
292 contamination Fraction of contamination in sequencing data (for all samples) to aggressively remove
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
293 dbsnp dbSNP file
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
294 debug If specified, print out very verbose debug information about each triggering active region
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
295 excludeAnnotation One or more specific annotations to exclude
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
296 genotyping_mode Specifies how to determine the alternate alleles to use for genotyping
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
297 graphOutput File to which debug assembly graph information should be written
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
298 group One or more classes/groups of annotations to apply to variant calls
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
299 heterozygosity Heterozygosity value used to compute prior likelihoods for any locus
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
300 minPruning The minimum allowed pruning factor in the assembly graph. Paths whose number of supporting kmers is less than or equal to this value are pruned from the graph
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
301 pair_hmm_implementation The PairHMM implementation to use for genotype likelihood calculations
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
302 stand_call_conf The minimum phred-scaled confidence threshold at which variants should be called
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
303 stand_emit_conf The minimum phred-scaled confidence threshold at which variants should be emitted (and filtered with LowQual if less than the calling threshold)
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
304 useAllelesTrigger If specified, use additional trigger on variants found in an external alleles file
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
305 fullHaplotype If specified, output the full haplotype sequence instead of converting to individual variants w.r.t. the reference
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
306 gcpHMM Flat gap continuation penalty for use in the Pair HMM
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
307 genotypeFullActiveRegion If specified, alternate alleles are considered to be the full active region for the purposes of genotyping
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
308 max_alternate_alleles Maximum number of alternate alleles to genotype
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
309
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
310 @CITATION_SECTION@
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
311 </help>
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
312 <expand macro="citations" />
01ff8dd37d4d Uploaded
lz_hust
parents:
diff changeset
313 </tool>