comparison snpEff.xml @ 10:5b4ac70948d2 draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/snpeff commit eea43430ff90fe6b13b295f6d5efb2208401a7ef
author iuc
date Tue, 27 Mar 2018 09:44:18 -0400
parents 68693743661e
children 5a29ab10dba6
comparison
equal deleted inserted replaced
9:68693743661e 10:5b4ac70948d2
1 <tool id="snpEff" name="SnpEff" version="@WRAPPER_VERSION@.1"> 1 <tool id="snpEff" name="SnpEff eff:" version="@wrapper_version@.1">
2 <description>Variant effect and annotation</description> 2 <description> annotate variants</description>
3 <macros> 3 <macros>
4 <import>snpEff_macros.xml</import> 4 <import>snpEff_macros.xml</import>
5 </macros> 5 </macros>
6 <expand macro="requirements" /> 6 <requirements>
7 <expand macro="requirement" />
8 </requirements>
7 <expand macro="stdio" /> 9 <expand macro="stdio" />
8 <expand macro="version_command" /> 10 <expand macro="version_command" />
9 <command><![CDATA[ 11 <command><![CDATA[
10 snpEff -Xmx8g eff 12 snpEff @java_options@ eff
11 -i $inputFormat -o ${outputConditional.outputFormat} -upDownStreamLen $udLength 13 -i $inputFormat -o ${outputConditional.outputFormat} -upDownStreamLen $udLength
12 #if $spliceSiteSize and str($spliceSiteSize) != '': 14 #if $spliceSiteSize and str($spliceSiteSize) != '':
13 -spliceSiteSize "$spliceSiteSize" 15 -spliceSiteSize "$spliceSiteSize"
14 #end if 16 #end if
15 #if $spliceRegion.setSpliceRegions == 'yes': 17 #if $spliceRegion.setSpliceRegions == 'yes':
70 #for reg in $regs: 72 #for reg in $regs:
71 -reg '"${reg}"' 73 -reg '"${reg}"'
72 #end for 74 #end for
73 #end if 75 #end if
74 '${snpDb.snpeff_db.metadata.genome_version}' 76 '${snpDb.snpeff_db.metadata.genome_version}'
77 #elif $snpDb.genomeSrc == 'custom':
78 -dataDir '${snpDb.snpeff_db.extra_files_path}'
79 -configOption '${snpDb.snpeff_db.metadata.genome_version}'.genome='${snpDb.snpeff_db.metadata.genome_version}'
80 -configOption '${snpDb.snpeff_db.metadata.genome_version}'.codonTable='${snpDb.codon_table}'
81 '${snpDb.snpeff_db.metadata.genome_version}'
75 #else 82 #else
76 -download 83 -download
77 '$snpDb.genome_version' 84 '$snpDb.genome_version'
78 #end if 85 #end if
79 '$input' > '$snpeff_output' 86 '$input' > '$snpeff_output'
90 ## Replace real SnpEff version with 2.0.5 to prevent this GATK 1.x error: "The version of SnpEff used to generate the SnpEff input file (x.x) is not currently supported by the GATK. Supported versions are: [2.0.5]" 97 ## Replace real SnpEff version with 2.0.5 to prevent this GATK 1.x error: "The version of SnpEff used to generate the SnpEff input file (x.x) is not currently supported by the GATK. Supported versions are: [2.0.5]"
91 sed -i.bak -e 's/^\#\#SnpEffVersion="\(\S*\s\)/\#\#SnpEffVersion="2.0.5 - real is \1/' '$snpeff_output' 98 sed -i.bak -e 's/^\#\#SnpEffVersion="\(\S*\s\)/\#\#SnpEffVersion="2.0.5 - real is \1/' '$snpeff_output'
92 #end if 99 #end if
93 ]]></command> 100 ]]></command>
94 <inputs> 101 <inputs>
95 <param name="input" type="data" format="vcf,tabular,pileup,bed" label="Sequence changes (SNPs, MNPs, InDels)"/> 102 <param name="input" type="data" format="vcf,bed" label="Sequence changes (SNPs, MNPs, InDels)"/>
96 103
97 <param name="inputFormat" type="select" label="Input format"> 104 <param name="inputFormat" type="select" label="Input format">
98 <option value="vcf" selected="true">VCF</option> 105 <option value="vcf" selected="true">VCF</option>
99 <option value="bed">BED (Deprecated)</option> 106 <option value="bed">BED (Deprecated)</option>
100 </param> 107 </param>
114 <when value="bedAnn" /> 121 <when value="bedAnn" />
115 </conditional> 122 </conditional>
116 123
117 <conditional name="snpDb"> 124 <conditional name="snpDb">
118 <param name="genomeSrc" type="select" label="Genome source"> 125 <param name="genomeSrc" type="select" label="Genome source">
119 <option value="cached">Locally installed reference genome</option> 126 <!-- These options are referenced in the help section of SnpEff download tool. If you change them, change help of SnpEff download as well -->
120 <option value="history">Reference genome from your history</option> 127 <option value="cached">Locally installed snpEff database</option>
121 <option value="named">Named on demand</option> 128 <option value="history">Downloaded snpEff database in your history</option>
129 <option value="named">Download on demand</option>
130 <option value="custom">Custom snpEff database in your history</option>
122 </param> 131 </param>
123 <when value="cached"> 132 <when value="cached">
124 <param name="genomeVersion" type="select" label="Genome"> 133 <param name="genomeVersion" type="select" label="Genome">
125 <!--GENOME DESCRIPTION--> 134 <!--GENOME DESCRIPTION-->
126 <options from_data_table="snpeffv_genomedb"> 135 <options from_data_table="snpeffv_genomedb">
127 <filter type="static_value" name="snpeff_version" value="@SNPEFF_VERSION@" column="1"/> 136 <filter type="static_value" name="snpeff_version" value="@snpeff_version@" column="1"/>
128 <filter type="unique_value" column="2" /> 137 <filter type="unique_value" column="2" />
129 </options> 138 </options>
130 </param> 139 </param>
131 <section name="reg_section" expanded="false" title="Regulation options"> 140 <section name="reg_section" expanded="false" title="Regulation options">
132 <param name="regulation" type="select" display="checkboxes" multiple="true" label="Non-coding and regulatory annotation" help="These are available for only a few genomes"> 141 <param name="regulation" type="select" display="checkboxes" multiple="true" label="Non-coding and regulatory annotation" help="These are available for only a few genomes">
136 </options> 145 </options>
137 </param> 146 </param>
138 </section> 147 </section>
139 </when> 148 </when>
140 <when value="history"> 149 <when value="history">
141 <param name="snpeff_db" type="data" format="snpeffdb" label="@SNPEFF_VERSION@ Genome Data"> 150 <param name="snpeff_db" type="data" format="snpeffdb" label="@snpeff_version@ Genome Data">
142 <options options_filter_attribute="metadata.snpeff_version" > 151 <options options_filter_attribute="metadata.snpeff_version" >
143 <filter type="add_value" value="@SNPEFF_VERSION@" /> 152 <filter type="add_value" value="@snpeff_version@" />
144 </options> 153 </options>
145 <validator type="expression" message="This version of SnpEff will only work with @SNPEFF_VERSION@ genome databases">value is not None and value.metadata.snpeff_version == "@SNPEFF_VERSION@"</validator> 154 <validator type="expression" message="This version of SnpEff will only work with @snpeff_version@ genome databases">value is not None and value.metadata.snpeff_version == "@snpeff_version@"</validator>
146 </param> 155 </param>
147 <section name="reg_section" expanded="false" title="Regulation options"> 156 <section name="reg_section" expanded="false" title="Regulation options">
148 <!-- From metadata --> 157 <!-- From metadata -->
149 <param name="regulation" type="select" display="checkboxes" multiple="true" label="Non-coding and regulatory annotation" help="These are available for only a few genomes"> 158 <param name="regulation" type="select" display="checkboxes" multiple="true" label="Non-coding and regulatory annotation" help="These are available for only a few genomes">
150 <options> 159 <options>
153 </param> 162 </param>
154 </section> 163 </section>
155 </when> 164 </when>
156 <when value="named"> 165 <when value="named">
157 <param name="genome_version" type="text" value="" label="Snpff Genome Version Name (e.g. GRCh38.76)"> 166 <param name="genome_version" type="text" value="" label="Snpff Genome Version Name (e.g. GRCh38.76)">
158 <help>@SNPEFF_DATABASE_URL@</help> 167 <help>@snpeff_database_url@</help>
159 <validator type="regex" message="A genome version name is required">\S+</validator> 168 <validator type="regex" message="A genome version name is required">\S+</validator>
160 </param> 169 </param>
161 </when> 170 </when>
171 <when value="custom">
172 <param name="snpeff_db" type="data" format="snpeffdb" label="@snpeff_version@ Genome Data">
173 <options options_filter_attribute="metadata.snpeff_version" >
174 <filter type="add_value" value="@snpeff_version@" />
175 </options>
176 <validator type="expression" message="This version of SnpEff will only work with @snpeff_version@ genome databases">value is not None and value.metadata.snpeff_version == "@snpeff_version@"</validator>
177 </param>
178 <param name="codon_table" type="select" label="Select genetic code for this sequence" help="If this sequence uses non-standard genetic code, select one from these options">
179 <option selected="true" value="Standard">Standard</option>
180 <option value="Vertebrate_Mitochondrial">Vertebrate_Mitochondrial</option>
181 <option value="Yeast_Mitochondrial">Yeast_Mitochondrial</option>
182 <option value="Mold_Mitochondrial">Mold_Mitochondrial</option>
183 <option value="Protozoan_Mitochondrial">Protozoan_Mitochondrial</option>
184 <option value="Coelenterate">Coelenterate</option>
185 <option value="Mitochondrial">Mitochondrial</option>
186 <option value="Mycoplasma">Mycoplasma</option>
187 <option value="Spiroplasma">Spiroplasma</option>
188 <option value="Invertebrate_Mitochondrial">Invertebrate_Mitochondrial</option>
189 <option value="Ciliate_Nuclear">Ciliate_Nuclear</option>
190 <option value="Dasycladacean_Nuclear">Dasycladacean_Nuclear</option>
191 <option value="Hexamita_Nuclear">Hexamita_Nuclear</option>
192 <option value="Echinoderm_Mitochondrial">Echinoderm_Mitochondrial</option>
193 <option value="Flatworm_Mitochondrial">Flatworm_Mitochondrial</option>
194 <option value="Euplotid_Nuclear">Euplotid_Nuclear</option>
195 <option value="Bacterial_and_Plant_Plastid">Bacterial_and_Plant_Plastid</option>
196 <option value="Alternative_Yeast_Nuclear">Alternative_Yeast_Nuclear</option>
197 <option value="Ascidian_Mitochondrial">Ascidian_Mitochondrial</option>
198 <option value="Alternative_Flatworm_Mitochondrial">Alternative_Flatworm_Mitochondrial</option>
199 <option value="Blepharisma_Macronuclear">Blepharisma_Macronuclear</option>
200 <option value="Chlorophycean_Mitochondrial">Chlorophycean_Mitochondrial</option>
201 <option value="Trematode_Mitochondrial">Trematode_Mitochondrial</option>
202 <option value="Scenedesmus_obliquus_Mitochondrial">Scenedesmus_obliquus_Mitochondrial</option>
203 <option value="Thraustochytrium_Mitochondrial">Thraustochytrium_Mitochondrial</option>
204 </param>
205 </when>
162 </conditional> 206 </conditional>
163 207
164 <param name="udLength" type="select" label="Upstream / Downstream length"> 208 <param name="udLength" type="select" label="Upstream / Downstream length" argument="-ud" >
165 <option value="0">No upstream / downstream intervals (0 bases)</option> 209 <option value="0">No upstream / downstream intervals (0 bases)</option>
166 <option value="200">200 bases</option> 210 <option value="200">200 bases</option>
167 <option value="500">500 bases</option> 211 <option value="500">500 bases</option>
168 <option value="1000">1000 bases</option> 212 <option value="1000">1000 bases</option>
169 <option value="2000">2000 bases</option> 213 <option value="2000">2000 bases</option>
170 <option value="5000" selected="true">5000 bases</option> 214 <option value="5000" selected="true">5000 bases</option>
171 <option value="10000">10000 bases</option> 215 <option value="10000">10000 bases</option>
172 <option value="20000">20000 bases</option> 216 <option value="20000">20000 bases</option>
173 </param> 217 </param>
174 218
175 <param name="spliceSiteSize" type="select" optional="true" label="Set size for splice sites (donor and acceptor) in bases"> 219 <param name="spliceSiteSize" type="select" optional="true" label="Set size for splice sites (donor and acceptor) in bases" argument="-ss">
176 <option value="1">1 base</option> 220 <option value="1">1 base</option>
177 <option value="2" selected="true">2 bases</option> 221 <option value="2" selected="true">2 bases</option>
178 <option value="3">3 bases</option> 222 <option value="3">3 bases</option>
179 <option value="4">4 bases</option> 223 <option value="4">4 bases</option>
180 <option value="5">5 bases</option> 224 <option value="5">5 bases</option>
189 <option value="no">Use Defaults</option> 233 <option value="no">Use Defaults</option>
190 <option value="yes">Set Splice Region Parameters</option> 234 <option value="yes">Set Splice Region Parameters</option>
191 </param> 235 </param>
192 <when value="no"/> 236 <when value="no"/>
193 <when value="yes"> 237 <when value="yes">
194 <param name="spliceRegionExonSize" type="integer" value="" min="1" max="10" optional="true" label="Set size for splice site region within exons. Default: 3 bases"/> 238 <param name="spliceRegionExonSize" type="integer" value="" min="1" max="10" optional="true" label="Set size for splice site region within exons. Default: 3 bases" argument="-spliceRegionExonSize"/>
195 <param name="spliceRegionIntronMin" type="integer" value="" min="1" max="10" optional="true" label="Set minimum number of bases for splice site region within intron. Default: 3 bases"/> 239 <param name="spliceRegionIntronMin" type="integer" value="" min="1" max="10" optional="true" label="Set minimum number of bases for splice site region within intron. Default: 3 bases" argument="-spliceRegionIntronMin"/>
196 <param name="spliceRegionIntronMax" type="integer" value="" min="1" max="10" optional="true" label="Set maximum number of bases for splice site region within intron. Default: 8 bases"/> 240 <param name="spliceRegionIntronMax" type="integer" value="" min="1" max="10" optional="true" label="Set maximum number of bases for splice site region within intron. Default: 8 bases" argument="-spliceRegionIntronMax"/>
197 </when> 241 </when>
198 </conditional> 242 </conditional>
199 243
200 <param name="annotations" type="select" display="checkboxes" multiple="true" label="Annotation options"> 244 <param name="annotations" type="select" display="checkboxes" multiple="true" label="Annotation options">
201 <option value="-formatEff">Use 'EFF' field compatible with older versions (instead of 'ANN')</option> 245 <option value="-formatEff">Use 'EFF' field compatible with older versions (instead of 'ANN')</option>
221 <!-- onlyReg option results in frequent exceptions with version 4.3k 265 <!-- onlyReg option results in frequent exceptions with version 4.3k
222 <option value="-onlyReg">Only use regulation tracks</option> 266 <option value="-onlyReg">Only use regulation tracks</option>
223 --> 267 -->
224 </param> 268 </param>
225 <!-- -cancerSamples <file> : Two column TXT file defining 'oringinal \t derived' samples. --> 269 <!-- -cancerSamples <file> : Two column TXT file defining 'oringinal \t derived' samples. -->
226 <param name="intervals" type="data" format="bed" optional="true" label="Use custom interval file for annotation"/> 270 <param name="intervals" type="data" format="bed" optional="true" label="Use custom interval file for annotation" argument="-interval"/>
227 <param name="transcripts" type="data" format="tabular" optional="true" label="Only use the transcripts in this file" help="Format is one transcript ID per line"/> 271 <param name="transcripts" type="data" format="tabular" optional="true" label="Only use the transcripts in this file" help="Format is one transcript ID per line"/>
228 <param name="filterOut" type="select" display="checkboxes" multiple="true" label="Filter output"> 272 <param name="filterOut" type="select" display="checkboxes" multiple="true" label="Filter output">
229 <option value="-no-downstream">Do not show DOWNSTREAM changes</option> 273 <option value="-no-downstream">Do not show DOWNSTREAM changes</option>
230 <option value="-no-intergenic">Do not show INTERGENIC changes</option> 274 <option value="-no-intergenic">Do not show INTERGENIC changes</option>
231 <option value="-no-intron">Do not show INTRON changes</option> 275 <option value="-no-intron">Do not show INTRON changes</option>
284 <option value="NEXT_PROT">NEXT_PROT (sequence_feature + exon_loss_variant) A 'NextProt' based annotation. Details are provided in the 'feature type' sub-field (ANN), or in the effect details (EFF). MODERATE </option> 328 <option value="NEXT_PROT">NEXT_PROT (sequence_feature + exon_loss_variant) A 'NextProt' based annotation. Details are provided in the 'feature type' sub-field (ANN), or in the effect details (EFF). MODERATE </option>
285 </param> 329 </param>
286 </when> 330 </when>
287 </conditional> 331 </conditional>
288 332
289 <param name="offset" type="select" display="radio" label="Chromosomal position"> 333 <param name="offset" type="select" display="radio" label="Chromosomal position" argument="-0 and -1">
290 <option value="default" selected="true">Use default (based on input type)</option> 334 <option value="default" selected="true">Use default (based on input type)</option>
291 <option value="-0">Force zero-based positions (both input and output)</option> 335 <option value="-0">Force zero-based positions (both input and output)</option>
292 <option value="-1">Force one-based positions (both input and output)</option> 336 <option value="-1">Force one-based positions (both input and output)</option>
293 </param> 337 </param>
294 <param name="chr" type="text" label="Text to prepend to chromosome name"> 338 <param name="chr" type="text" label="Text to prepend to chromosome name" argument="-chr">
295 <help> 339 <help>
296 By default SnpEff simplifies all chromosome names. For instance 'chr1' is just '1'. 340 By default SnpEff simplifies all chromosome names. For instance 'chr1' is just '1'.
297 You can prepend any string you want to the chromosome name 341 You can prepend any string you want to the chromosome name
298 </help> 342 </help>
299 <validator type="regex" message="No whitespace allowed">^\S*$</validator> 343 <validator type="regex" message="No whitespace allowed">^\S*$</validator>
300 </param> 344 </param>
301 <param name="generate_stats" type="boolean" truevalue="" falsevalue="-noStats" checked="true" label="Produce Summary Stats"/> 345 <param name="generate_stats" type="boolean" truevalue="" falsevalue="-noStats" checked="true" label="Produce Summary Stats" argument="-noStats"/>
302 <param name="noLog" type="boolean" truevalue="-noLog" falsevalue="" checked="true" label="Suppress reporting usage statistics to server"/> 346 <param name="noLog" type="boolean" truevalue="-noLog" falsevalue="" checked="true" label="Suppress reporting usage statistics to server" argument="-noLog"/>
303 </inputs> 347 </inputs>
304 <outputs> 348 <outputs>
305 <data name="snpeff_output" format="vcf"> 349 <data name="snpeff_output" format="vcf">
306 <change_format> 350 <change_format>
307 <when input="outputConditional.outputFormat" value="bed" format="bed" /> 351 <when input="outputConditional.outputFormat" value="bed" format="bed" />
328 </assert_contents> 372 </assert_contents>
329 </output> 373 </output>
330 </test> 374 </test>
331 </tests> 375 </tests>
332 <help><![CDATA[ 376 <help><![CDATA[
333 This tool calculate the effect of variants (SNPs/MNPs/Insertions) and deletions. 377
334 378 **What it does**
335 @EXTERNAL_DOCUMENTATION@ 379
380 SnpEff is a variant annotation and effect prediction tool. It annotates and predicts the effects of genetic variants (such as amino acid changes).
381
382 A typical SnpEff use case would be:
383
384 - **Input**: The inputs are predicted variants (SNPs, insertions, deletions and MNPs). The input file is usually obtained as a result of a sequencing experiment, and it is usually in variant call format (VCF).
385 - **Output**: SnpEff analyzes the input variants. It annotates the variants and calculates the effects they produce on known genes (e.g. amino acid changes). A list of effects and annotations that SnpEff can calculate can be found here.
386
387 By genetic variant we mean difference between a genome and a "reference" genome. As an example, imagine we are sequencing a "sample". Here "sample" can mean anything that you are interested in studying, from a cell culture, to a mouse or a cancer patient. It is a standard procedure to compare your sample sequences against the corresponding "reference genome". For instance you may compare the cancer patient genome against the "reference genome".
388
389 In a typical sequencing experiment, you will find many places in the genome where your sample differs from the reference genome. These are called "genomic variants" or just "variants".
390 Typically, variants are categorized as follows:
391
392 - SNP (Single-Nucleotide Polymorphism) Reference = 'A', Sample = 'C'
393 - Ins (Insertion) Reference = 'A', Sample = 'AGT'
394 - Del (Deletion) Reference = 'AC', Sample = 'C'
395 - MNP (Multiple-nucleotide polymorphism) Reference = 'ATA', Sample = 'GTC'
396 - MIXED (Multiple-nucleotide and an InDel) Reference = 'ATA', Sample = 'GTCAGT'
397
398 This is not a comprehensive list, it is just to give you an idea.
399
400 Suppose you have a huge file describing all the differences between your sample and the reference genome. But you want to know more about these variants than just their genetic coordinates. E.g.: Are they in a gene? In an exon? Do they change protein coding? Do they cause premature stop codons? SnpEff can help you answer all these questions. The process of adding this information about the variants is called "Annotation".
401 SnpEff provides several degrees of annotations, from simple (e.g. which gene is each variant affecting) to extremely complex annotations (e.g. will this non-coding variant affect the expression of a gene?). It should be noted that the more complex the annotations, the more it relies in computational predictions. Such computational predictions can be incorrect, so results from SnpEff (or any prediction algorithm) cannot be trusted blindly, they must be analyzed and independently validated by corresponding wet-lab experiments.
402
403 @snpeff_in_galaxy_info@
404 @external_documentation@
336 ]]> 405 ]]>
337 </help> 406 </help>
338 <expand macro="citations" /> 407 <expand macro="citations" />
339 </tool> 408 </tool>