comparison snpEff.xml @ 0:2a3a00c1fa0a draft default tip

"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/snpeff commit e6d1b32be9df14beb1e2859a0d2fa29a2d09227e"
author iuc
date Thu, 18 Jun 2020 16:11:49 -0400
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:2a3a00c1fa0a
1 <tool id="snpeff_sars_cov_2" name="SnpEff eff:" version="@WRAPPER_VERSION@">
2 <description> annotate variants for SARS-CoV-2</description>
3 <macros>
4 <import>snpEff_macros.xml</import>
5 </macros>
6 <requirements>
7 <expand macro="requirement" />
8 </requirements>
9 <expand macro="stdio" />
10 <expand macro="version_command" />
11 <command><![CDATA[
12 snpEff @JAVA_OPTIONS@ eff
13 -i $inputFormat -o ${outputConditional.outputFormat} -upDownStreamLen $udLength
14 #if $annotations and str($annotations) != '':
15 #echo " "
16 #echo ' '.join(str($annotations).split(','))
17 #end if
18 #if $filterOut and str($filterOut) != '':
19 #echo " "
20 #echo ' '.join(str($filterOut).split(','))
21 #end if
22 #if $filter.specificEffects == 'yes' and $filter.effects:
23 #for $eff in str($filter.effects).split(','):
24 -no $eff
25 #end for
26 #end if
27 #if $transcripts
28 -onlyTr '$transcripts'
29 #end if
30 #if $intervals ### fix this for multiple dataset input
31 -interval '$intervals'
32 #end if
33 #if $statsFile:
34 -stats '$statsFile'
35 #end if
36 #if $csvStats:
37 -csvStats '$csvFile'
38 #end if
39 #if str($offset) != 'default':
40 ${offset}
41 #end if
42 #if str($chr).strip() != '':
43 -chr '$chr'
44 #end if
45 $noLog
46
47 $genome_version
48
49 '$input' > '$snpeff_output'
50
51 #if $statsFile:
52 &&
53 #import os
54 #if $csvStats:
55 #set $genes_file = str($csvFile) + '.genes.txt'
56 #else
57 #set $genes_file = str($statsFile) + '.genes.txt'
58 #end if
59 #set $genes_file_name = os.path.split($genes_file)[-1]
60 mkdir '$statsFile.files_path' &&
61 mv '$genes_file' '#echo os.path.join($statsFile.files_path, $genes_file_name)#'
62 #end if
63 #if $outputConditional.outputFormat == 'gatk' and $outputConditional.gatk_v1
64 &&
65 ## Replace real SnpEff version with 2.0.5 to prevent this GATK 1.x error: "The version of SnpEff used to generate the SnpEff input file (x.x) is not currently supported by the GATK. Supported versions are: [2.0.5]"
66 sed -i.bak -e 's/^\#\#SnpEffVersion="\(\S*\s\)/\#\#SnpEffVersion="2.0.5 - real is \1/' '$snpeff_output'
67 #end if
68 ]]></command>
69 <inputs>
70 <param name="input" type="data" format="vcf,bed" label="Sequence changes (SNPs, MNPs, InDels)"/>
71
72 <param name="inputFormat" type="select" label="Input format">
73 <option value="vcf" selected="true">VCF</option>
74 <option value="bed">BED (Deprecated)</option>
75 </param>
76
77 <param name="genome_version" type="select" label="Select an annotated Coronavirus genome">
78 <option value="NC_045512.2">NC_045512.2: COVID19 Severe acute respiratory syndrome coronavirus 2 isolate Wuhan-Hu-1</option>
79 <option value="DQ648856.1">DQ648856.1: Bat coronavirus (BtCoV/273/2005), complete genome.</option>
80 <option value="DQ648857.1">DQ648857.1: Bat coronavirus (BtCoV/279/2005), complete genome.</option>
81 <option value="JX993988.1">JX993988.1: Bat coronavirus Cp/Yunnan2011, complete genome.</option>
82 <option value="MN996532.1">MN996532.1: Bat coronavirus RaTG13, complete genome.</option>
83 <option value="JX993987.1">JX993987.1: Bat coronavirus Rp/Shaanxi2011, complete genome.</option>
84 <option value="GQ153545.1">GQ153545.1: Bat SARS coronavirus HKU3-10, complete genome.</option>
85 <option value="GQ153546.1">GQ153546.1: Bat SARS coronavirus HKU3-11, complete genome.</option>
86 <option value="GQ153547.1">GQ153547.1: Bat SARS coronavirus HKU3-12, complete genome.</option>
87 <option value="DQ022305.2">DQ022305.2: Bat SARS coronavirus HKU3-1, complete genome.</option>
88 <option value="DQ084199.1">DQ084199.1: bat SARS coronavirus HKU3-2, complete genome.</option>
89 <option value="DQ084200.1">DQ084200.1: bat SARS coronavirus HKU3-3, complete genome.</option>
90 <option value="GQ153539.1">GQ153539.1: Bat SARS coronavirus HKU3-4, complete genome.</option>
91 <option value="GQ153540.1">GQ153540.1: Bat SARS coronavirus HKU3-5, complete genome.</option>
92 <option value="GQ153541.1">GQ153541.1: Bat SARS coronavirus HKU3-6, complete genome.</option>
93 <option value="GQ153542.1">GQ153542.1: Bat SARS coronavirus HKU3-7, complete genome.</option>
94 <option value="GQ153543.1">GQ153543.1: Bat SARS coronavirus HKU3-8, complete genome.</option>
95 <option value="GQ153544.1">GQ153544.1: Bat SARS coronavirus HKU3-9, complete genome.</option>
96 <option value="FJ588686.1">FJ588686.1: Bat SARS CoV Rs672/2006, complete genome.</option>
97 <option value="KC881006.1">KC881006.1: Bat SARS-like coronavirus Rs3367, complete genome.</option>
98 <option value="KC881005.1">KC881005.1: Bat SARS-like coronavirus RsSHC014, complete genome.</option>
99 <option value="KF367457.1">KF367457.1: Bat SARS-like coronavirus WIV1, complete genome.</option>
100 <option value="KP886808.1">KP886808.1: Bat SARS-like coronavirus YNLF_31C, complete genome.</option>
101 <option value="KP886809.1">KP886809.1: Bat SARS-like coronavirus YNLF_34C, complete genome.</option>
102 <option value="KJ473812.1">KJ473812.1: BtRf-BetaCoV/HeB2013, complete genome.</option>
103 <option value="KJ473811.1">KJ473811.1: BtRf-BetaCoV/JL2012, complete genome.</option>
104 <option value="KJ473813.1">KJ473813.1: BtRf-BetaCoV/SX2013, complete genome.</option>
105 <option value="KJ473815.1">KJ473815.1: BtRs-BetaCoV/GX2013, complete genome.</option>
106 <option value="KJ473814.1">KJ473814.1: BtRs-BetaCoV/HuB2013, complete genome.</option>
107 <option value="KJ473816.1">KJ473816.1: BtRs-BetaCoV/YN2013, complete genome.</option>
108 <option value="KF569996.1">KF569996.1: Rhinolophus affinis coronavirus isolate LYRa11, complete genome.</option>
109 <option value="AY687354.1">AY687354.1: SARS coronavirus A001 spike glycoprotein gene, complete cds.</option>
110 <option value="AY687355.1">AY687355.1: SARS coronavirus A013 spike glycoprotein gene, complete cds.</option>
111 <option value="AY687356.1">AY687356.1: SARS coronavirus A021 spike glycoprotein gene, complete cds.</option>
112 <option value="AY686863.1">AY686863.1: SARS coronavirus A022, complete genome.</option>
113 <option value="AY687357.1">AY687357.1: SARS coronavirus A030 spike glycoprotein gene, complete cds.</option>
114 <option value="AY687358.1">AY687358.1: SARS coronavirus A031 spike glycoprotein gene, complete cds.</option>
115 <option value="AY427439.1">AY427439.1: SARS coronavirus AS, complete genome.</option>
116 <option value="AY687359.1">AY687359.1: SARS coronavirus B012 spike glycoprotein gene, complete cds.</option>
117 <option value="AY687360.1">AY687360.1: SARS coronavirus B024 spike glycoprotein gene, complete cds.</option>
118 <option value="AY687361.1">AY687361.1: SARS coronavirus B029 spike glycoprotein gene, complete cds.</option>
119 <option value="AY687362.1">AY687362.1: SARS coronavirus B033 spike glycoprotein gene, complete cds.</option>
120 <option value="AY686864.1">AY686864.1: SARS coronavirus B039, complete genome.</option>
121 <option value="AY687364.1">AY687364.1: SARS coronavirus B040 spike glycoprotein gene, complete cds.</option>
122 <option value="AY278488.2">AY278488.2: SARS coronavirus BJ01, complete genome.</option>
123 <option value="AY279354.2">AY279354.2: SARS coronavirus BJ04, complete genome.</option>
124 <option value="AY864805.1">AY864805.1: SARS coronavirus BJ162, complete genome.</option>
125 <option value="EU371564.1">EU371564.1: SARS coronavirus BJ182-12, complete genome.</option>
126 <option value="EU371562.1">EU371562.1: SARS coronavirus BJ182-4, complete genome.</option>
127 <option value="EU371563.1">EU371563.1: SARS coronavirus BJ182-8, complete genome.</option>
128 <option value="EU371560.1">EU371560.1: SARS coronavirus BJ182a, complete genome.</option>
129 <option value="EU371561.1">EU371561.1: SARS coronavirus BJ182b, complete genome.</option>
130 <option value="AY864806.1">AY864806.1: SARS coronavirus BJ202, complete genome.</option>
131 <option value="AY340092.1">AY340092.1: SARS coronavirus BJ2232 RNA polymerase gene, partial cds.</option>
132 <option value="AY714217.1">AY714217.1: SARS Coronavirus CDC#200301157, complete genome.</option>
133 <option value="AY572034.1">AY572034.1: SARS coronavirus civet007, complete genome.</option>
134 <option value="AY572035.1">AY572035.1: SARS coronavirus civet010, complete genome.</option>
135 <option value="AY572038.1">AY572038.1: SARS coronavirus civet020, complete genome.</option>
136 <option value="AY345986.1">AY345986.1: SARS coronavirus CUHK-AG01, complete genome.</option>
137 <option value="AY345987.1">AY345987.1: SARS coronavirus CUHK-AG02, complete genome.</option>
138 <option value="AY345988.1">AY345988.1: SARS coronavirus CUHK-AG03, complete genome.</option>
139 <option value="AY282752.2">AY282752.2: SARS coronavirus CUHK-Su10, complete genome.</option>
140 <option value="AY278554.2">AY278554.2: SARS coronavirus CUHK-W1, complete genome.</option>
141 <option value="AY310120.1">AY310120.1: SARS coronavirus FRA, complete genome.</option>
142 <option value="AY278489.2">AY278489.2: SARS coronavirus GD01, complete genome.</option>
143 <option value="AY313906.1">AY313906.1: SARS coronavirus GD69, complete genome.</option>
144 <option value="DQ640652.1">DQ640652.1: SARS coronavirus GDH-BJH01, complete genome.</option>
145 <option value="AY390556.1">AY390556.1: SARS coronavirus GZ02, complete genome.</option>
146 <option value="AY568539.1">AY568539.1: SARS coronavirus GZ0401, complete genome.</option>
147 <option value="AY613947.1">AY613947.1: SARS coronavirus GZ0402, complete genome.</option>
148 <option value="AY304495.1">AY304495.1: SARS coronavirus GZ50, complete genome.</option>
149 <option value="AY394978.1">AY394978.1: SARS coronavirus GZ-B, complete genome.</option>
150 <option value="AY394979.1">AY394979.1: SARS coronavirus GZ-C, complete genome.</option>
151 <option value="AY515512.1">AY515512.1: SARS coronavirus HC/SZ/61/03, complete genome.</option>
152 <option value="JQ316196.1">JQ316196.1: SARS coronavirus HKU-39849 isolate UOB, complete genome.</option>
153 <option value="AY323977.2">AY323977.2: SARS coronavirus HSR 1, complete genome.</option>
154 <option value="AY595412.1">AY595412.1: SARS coronavirus LLJ-2004, complete genome.</option>
155 <option value="AY508724.1">AY508724.1: SARS coronavirus NS-1, complete genome.</option>
156 <option value="FJ882963.1">FJ882963.1: SARS coronavirus P2, complete genome.</option>
157 <option value="AY350750.1">AY350750.1: SARS coronavirus PUMC01, complete genome.</option>
158 <option value="AY357075.1">AY357075.1: SARS coronavirus PUMC02, complete genome.</option>
159 <option value="AY357076.1">AY357076.1: SARS coronavirus PUMC03, complete genome.</option>
160 <option value="AY463059.1">AY463059.1: SARS coronavirus ShanghaiQXC1, complete genome.</option>
161 <option value="AY463060.1">AY463060.1: SARS coronavirus ShanghaiQXC2, complete genome.</option>
162 <option value="AY485277.1">AY485277.1: SARS coronavirus Sino1-11, complete genome.</option>
163 <option value="AY485278.1">AY485278.1: SARS coronavirus Sino3-11, complete genome.</option>
164 <option value="AY304488.1">AY304488.1: SARS coronavirus SZ16, complete genome.</option>
165 <option value="AY304486.1">AY304486.1: SARS coronavirus SZ3, complete genome.</option>
166 <option value="AY338174.1">AY338174.1: SARS coronavirus Taiwan TC1, complete genome.</option>
167 <option value="AY338175.1">AY338175.1: SARS coronavirus Taiwan TC2, complete genome.</option>
168 <option value="AY348314.1">AY348314.1: SARS coronavirus Taiwan TC3, complete genome.</option>
169 <option value="AY654624.1">AY654624.1: SARS coronavirus TJF, complete genome.</option>
170 <option value="AY502923.1">AY502923.1: SARS coronavirus TW10, complete genome.</option>
171 <option value="AY502924.1">AY502924.1: SARS coronavirus TW11, complete genome.</option>
172 <option value="AY291451.1">AY291451.1: SARS coronavirus TW1, complete genome.</option>
173 <option value="AY502925.1">AY502925.1: SARS coronavirus TW2, complete genome.</option>
174 <option value="AY502926.1">AY502926.1: SARS coronavirus TW3, complete genome.</option>
175 <option value="AY502927.1">AY502927.1: SARS coronavirus TW4, complete genome.</option>
176 <option value="AY502928.1">AY502928.1: SARS coronavirus TW5, complete genome.</option>
177 <option value="AY502929.1">AY502929.1: SARS coronavirus TW6, complete genome.</option>
178 <option value="AY502930.1">AY502930.1: SARS coronavirus TW7, complete genome.</option>
179 <option value="AY502931.1">AY502931.1: SARS coronavirus TW8, complete genome.</option>
180 <option value="AY502932.1">AY502932.1: SARS coronavirus TW9, complete genome.</option>
181 <option value="AP006557.1">AP006557.1: SARS coronavirus TWH genomic RNA, complete genome.</option>
182 <option value="AP006558.1">AP006558.1: SARS coronavirus TWJ genomic RNA, complete genome.</option>
183 <option value="AP006559.1">AP006559.1: SARS coronavirus TWK genomic RNA, complete genome.</option>
184 <option value="AP006560.1">AP006560.1: SARS coronavirus TWS genomic RNA, complete genome.</option>
185 <option value="AP006561.1">AP006561.1: SARS coronavirus TWY genomic RNA, complete genome.</option>
186 <option value="AY278741.1">AY278741.1: SARS coronavirus Urbani, complete genome.</option>
187 <option value="MK062181.1">MK062181.1: SARS coronavirus Urbani isolate icSARS-C3, complete genome.</option>
188 <option value="MK062182.1">MK062182.1: SARS coronavirus Urbani isolate icSARS-C3-MA, complete genome.</option>
189 <option value="MK062183.1">MK062183.1: SARS coronavirus Urbani isolate icSARS-C7, complete genome.</option>
190 <option value="MK062184.1">MK062184.1: SARS coronavirus Urbani isolate icSARS-C7-MA, complete genome.</option>
191 <option value="MK062179.1">MK062179.1: SARS coronavirus Urbani isolate icSARS, complete genome.</option>
192 <option value="MK062180.1">MK062180.1: SARS coronavirus Urbani isolate icSARS-MA, complete genome.</option>
193 <option value="AY772062.1">AY772062.1: SARS coronavirus WH20, complete genome.</option>
194 <option value="EU371559.1">EU371559.1: SARS coronavirus ZJ02, complete genome.</option>
195 <option value="DQ182595.1">DQ182595.1: SARS coronavirus ZJ0301 from China, complete genome.</option>
196 </param>
197
198 <conditional name="outputConditional">
199 <param name="outputFormat" type="select" label="Output format">
200 <option value="vcf" selected="true">VCF (only if input is VCF)</option>
201 <option value="gatk">GATK-compatible VCF (only if input is VCF)</option>
202 <option value="bed">BED</option>
203 <option value="bedAnn">BED annotations</option>
204 </param>
205 <when value="vcf" />
206 <when value="gatk">
207 <param name="gatk_v1" type="boolean" checked="true" label="Compatible with GATK 1.x" />
208 </when>
209 <when value="bed" />
210 <when value="bedAnn" />
211 </conditional>
212 <param name="csvStats" type="boolean" truevalue="-csvStats" falsevalue="" checked="false" label="Create CSV report, useful for downstream analysis (-csvStats)" />
213
214 <param name="udLength" argument="-ud" type="select" label="Upstream / Downstream length">
215 <option value="0" selected="true">No upstream / downstream intervals (0 bases)</option>
216 <option value="10">10 bases</option>
217 <option value="50">50 bases</option>
218 <option value="100">100 bases</option>
219 <option value="200">200 bases</option>
220 <option value="500">500 bases</option>
221 <option value="1000">1000 bases</option>
222 <option value="2000">2000 bases</option>
223 <option value="5000">5000 bases</option>
224 </param>
225
226 <param name="annotations" type="select" display="checkboxes" multiple="true" label="Annotation options">
227 <option value="-formatEff">Use 'EFF' field compatible with older versions (instead of 'ANN')</option>
228 <option value="-classic">Use Classic Effect names and amino acid variant annotations (NON_SYNONYMOUS_CODING vs missense_variant and G180R vs p.Gly180Arg/c.538G>C)</option>
229 <option value="-sequenceOntology">Override classic and use Sequence Ontolgy terms for effects (missense_variant vs NON_SYNONYMOUS_CODING)</option>
230 <option value="-hgvs">Override classic and use HGVS annotations for amino acid annotations (p.Gly180Arg/c.538G>C vs G180R)</option>
231 <option value="-hgvsOld">Old notation style notation: E.g. 'c.G123T' instead of 'c.123G>T' and 'X' instead of '*'</option>
232 <option value="-hgvs1LetterAa">Use one letter Amino acid codes in HGVS notation. E.g. p.R47G instead of p.Arg47Gly</option>
233 <option value="-hgvsTrId">Use transcript ID in HGVS notation. E.g. ENST00000252100:c.914C>G instead of c.914C>G</option>
234 <option value="-noShiftHgvs">Do not shift variants according to HGVS notation (most 3prime end)</option>
235 <option value="-noHgvs">Do not add HGVS annotations</option>
236 <option value="-canon">Only use canonical transcripts</option>
237 <option value="-onlyProtein">Only use protein coding transcripts</option>
238 <option value="-geneId">Use gene ID instead of gene name (VCF output)</option>
239 <option value="-noExpandIUB">Disable IUB code expansion in input variants</option>
240 <option value="-oicr">Add OICR tag in VCF file</option>
241 <option value="-noLof">Do not add LOF and NMD annotations</option>
242 <option value="-noInteraction">Disable interaction annotations</option>
243 </param>
244 <!-- -cancerSamples <file> : Two column TXT file defining 'oringinal \t derived' samples. -->
245 <param name="intervals" argument="-interval" type="data" format="bed" optional="true" label="Use custom interval file for annotation" />
246 <param name="transcripts" type="data" format="tabular" optional="true" label="Only use the transcripts in this file" help="Format is one transcript ID per line"/>
247 <param name="filterOut" type="select" display="checkboxes" multiple="true" label="Filter output">
248 <option value="-no-downstream">Do not show DOWNSTREAM changes</option>
249 <option value="-no-intergenic">Do not show INTERGENIC changes</option>
250 <option value="-no-upstream">Do not show UPSTREAM changes</option>
251 <option value="-no-utr">Do not show 5_PRIME_UTR or 3_PRIME_UTR changes</option>
252 </param>
253 <conditional name="filter">
254 <param name="specificEffects" type="select" label="Filter out specific Effects">
255 <option value="no">No</option>
256 <option value="yes">Yes</option>
257 </param>
258 <when value="no"/>
259 <when value="yes">
260 <param name="effects" type="select" display="checkboxes" multiple="true" label="Filter output: do not report these Effects">
261 <option value="CDS">CDS (coding_sequence_variant) The variant hits a CDS. MODIFIER</option>
262 <option value="CHROMOSOME_LARGE_DELETION">CHROMOSOME_LARGE_DELETION (chromosome) A large parte (over 1%) of the chromosome was deleted. HIGH</option>
263 <option value="CODON_CHANGE">CODON_CHANGE (coding_sequence_variant) One or many codons are changed e.g.: An MNP of size multiple of 3 MODERATE</option>
264 <option value="CODON_INSERTION">CODON_INSERTION (inframe_insertion) One or many codons are inserted e.g.: An insert multiple of three in a codon boundary MODERATE</option>
265 <option value="CODON_CHANGE_PLUS_CODON_INSERTION">CODON_CHANGE_PLUS_CODON_INSERTION (disruptive_inframe_insertion) One codon is changed and one or many codons are inserted e.g.: An insert of size multiple of three, not at codon boundary MODERATE</option>
266 <option value="CODON_DELETION">CODON_DELETION (inframe_deletion) One or many codons are deleted e.g.: A deletion multiple of three at codon boundary MODERATE</option>
267 <option value="CODON_CHANGE_PLUS_CODON_DELETION">CODON_CHANGE_PLUS_CODON_DELETION (disruptive_inframe_deletion) One codon is changed and one or more codons are deleted e.g.: A deletion of size multiple of three, not at codon boundary MODERATE</option>
268 <option value="DOWNSTREAM">DOWNSTREAM (downstream_gene_variant) Downstream of a gene (default length: 5K bases) MODIFIER</option>
269 <option value="EXON">EXON (exon_variant) The variant hits an exon (from a non-coding transcript) or a retained intron. MODIFIER</option>
270 <option value="EXON_DELETED">EXON_DELETED (exon_loss_variant) A deletion removes the whole exon. HIGH</option>
271 <option value="FRAME_SHIFT">FRAME_SHIFT (frameshift_variant) Insertion or deletion causes a frame shift e.g.: An indel size is not multple of 3 HIGH</option>
272 <option value="GENE">GENE (gene_variant) The variant hits a gene. MODIFIER</option>
273 <option value="INTERGENIC">INTERGENIC (intergenic_region) The variant is in an intergenic region MODIFIER</option>
274 <option value="INTERGENIC_CONSERVED">INTERGENIC_CONSERVED (conserved_intergenic_variant) The variant is in a highly conserved intergenic region MODIFIER</option>
275 <option value="INTRAGENIC">INTRAGENIC (intragenic_variant) The variant hits a gene, but no transcripts within the gene MODIFIER</option>
276 <option value="INTRON">INTRON (intron_variant) Variant hits and intron. Technically, hits no exon in the transcript. MODIFIER</option>
277 <option value="INTRON_CONSERVED">INTRON_CONSERVED (conserved_intron_variant) The variant is in a highly conserved intronic region MODIFIER</option>
278 <option value="MICRO_RNA">MICRO_RNA (miRNA) Variant affects an miRNA MODIFIER</option>
279 <option value="NON_SYNONYMOUS_CODING">NON_SYNONYMOUS_CODING (missense_variant) Variant causes a codon that produces a different amino acid e.g.: Tgg/Cgg, W/R MODERATE</option>
280 <option value="NON_SYNONYMOUS_START">NON_SYNONYMOUS_START (initiator_codon_variant) Variant causes start codon to be mutated into another start codon (the new codon produces a different AA). e.g.: Atg/Ctg, M/L (ATG and CTG can be START codons) LOW</option>
281 <option value="NON_SYNONYMOUS_STOP">NON_SYNONYMOUS_STOP (stop_retained_variant) Variant causes stop codon to be mutated into another stop codon (the new codon produces a different AA). e.g.: Atg/Ctg, M/L (ATG and CTG can be START codons) LOW</option>
282 <option value="RARE_AMINO_ACID">RARE_AMINO_ACID (rare_amino_acid_variant) The variant hits a rare amino acid thus is likely to produce protein loss of function HIGH</option>
283 <option value="SPLICE_SITE_ACCEPTOR">SPLICE_SITE_ACCEPTOR (splice_acceptor_variant) The variant hits a splice acceptor site (defined as two bases before exon start, except for the first exon). HIGH</option>
284 <option value="SPLICE_SITE_DONOR">SPLICE_SITE_DONOR (splice_donor_variant) The variant hits a Splice donor site (defined as two bases after coding exon end, except for the last exon). HIGH</option>
285 <option value="SPLICE_SITE_REGION">SPLICE_SITE_REGION (splice_region_variant) A sequence variant in which a change has occurred within the region of the splice site, either within 1-3 bases of the exon or 3-8 bases of the intron. LOW</option>
286 <option value="SPLICE_SITE_BRANCH">SPLICE_SITE_BRANCH (splice_region_variant) A varaint affective putative (Lariat) branch point, located in the intron. LOW</option>
287 <option value="SPLICE_SITE_BRANCH_U12">SPLICE_SITE_BRANCH_U12 (splice_region_variant) A varaint affective putative (Lariat) branch point from U12 splicing machinery, located in the intron. MODERATE</option>
288 <option value="STOP_LOST">STOP_LOST (stop_lost) Variant causes stop codon to be mutated into a non-stop codon e.g.: Tga/Cga, */R HIGH</option>
289 <option value="START_GAINED">START_GAINED (5_prime_UTR_premature start_codon_gain_variant) A variant in 5'UTR region produces a three base sequence that can be a START codon. LOW</option>
290 <option value="START_LOST">START_LOST (start_lost) Variant causes start codon to be mutated into a non-start codon. e.g.: aTg/aGg, M/R HIGH</option>
291 <option value="STOP_GAINED">STOP_GAINED (stop_gained) Variant causes a STOP codon e.g.: Cag/Tag, Q/* HIGH</option>
292 <option value="SYNONYMOUS_CODING">SYNONYMOUS_CODING (synonymous_variant) Variant causes a codon that produces the same amino acid e.g.: Ttg/Ctg, L/L LOW</option>
293 <option value="SYNONYMOUS_START">SYNONYMOUS_START (start_retained) Variant causes start codon to be mutated into another start codon. e.g.: Ttg/Ctg, L/L (TTG and CTG can be START codons) LOW</option>
294 <option value="SYNONYMOUS_STOP">SYNONYMOUS_STOP (stop_retained_variant) Variant causes stop codon to be mutated into another stop codon. e.g.: taA/taG, */* LOW</option>
295 <option value="TRANSCRIPT">TRANSCRIPT (transcript_variant) The variant hits a transcript. MODIFIER</option>
296 <option value="REGULATION">REGULATION (regulatory_region_variant) The variant hits a known regulatory feature (non-coding). MODIFIER</option>
297 <option value="UPSTREAM">UPSTREAM (upstream_gene_variant) Upstream of a gene (default length: 5K bases) MODIFIER</option>
298 <option value="UTR_3_PRIME">UTR_3_PRIME (3_prime_UTR_variant) Variant hits 3'UTR region MODIFIER</option>
299 <option value="UTR_3_DELETED">UTR_3_DELETED (3_prime_UTR_truncation + exon_loss) The variant deletes an exon which is in the 3'UTR of the transcript MODERATE</option>
300 <option value="UTR_5_PRIME">UTR_5_PRIME (5_prime_UTR_variant) Variant hits 5'UTR region MODIFIER</option>
301 <option value="UTR_5_DELETED">UTR_5_DELETED (5_prime_UTR_truncation + exon_loss_variant) The variant deletes an exon which is in the 5'UTR of the transcript MODERATE</option>
302 </param>
303 </when>
304 </conditional>
305
306 <param name="offset" type="select" display="radio" label="Chromosomal position">
307 <option value="default" selected="true">Use default (based on input type)</option>
308 <option value="-0">Force zero-based positions (both input and output)</option>
309 <option value="-1">Force one-based positions (both input and output)</option>
310 </param>
311 <param argument="-chr" type="text" label="Text to prepend to chromosome name">
312 <help>
313 By default SnpEff simplifies all chromosome names. For instance 'chr1' is just '1'.
314 You can prepend any string you want to the chromosome name
315 </help>
316 <validator type="regex" message="No whitespace allowed">^\S*$</validator>
317 </param>
318 <param name="generate_stats" argument="-noStats" type="boolean" truevalue="" falsevalue="-noStats" checked="true" label="Produce Summary Stats" />
319 <param argument="-noLog" type="boolean" truevalue="-noLog" falsevalue="" checked="true" label="Suppress reporting usage statistics to server" />
320 </inputs>
321 <outputs>
322 <data name="snpeff_output" format="vcf">
323 <change_format>
324 <when input="outputConditional.outputFormat" value="bed" format="bed" />
325 <when input="outputConditional.outputFormat" value="bedAnn" format="bed" />
326 </change_format>
327 </data>
328 <data name="statsFile" format="html" label="${tool.name} on ${on_string} - HTML stats">
329 <filter>generate_stats == True</filter>
330 </data>
331 <data name="csvFile" format="csv" label="${tool.name} on ${on_string} - CSV stats">
332 <filter>csvStats == True</filter>
333 </data>
334 </outputs>
335 <tests>
336 <test>
337 <param name="input" ftype="vcf" value="input.vcf"/>
338 <param name="inputFormat" value="vcf"/>
339 <param name="outputFormat" value="vcf"/>
340 <param name="genome_version" value="NC_045512.2" />
341 <param name="udLength" value="0"/>
342 <param name="generate_stats" value="false"/>
343 <output name="snpeff_output" file="output.vcf" lines_diff="2"/>
344 </test>
345 </tests>
346 <help><![CDATA[
347 **What it does**
348
349 **This is a special edition of SnpEff tweaked for SARS-CoV-2 variant annotation.**
350
351 SnpEff is a variant annotation and effect prediction tool. It annotates and predicts the effects of genetic variants (such as amino acid changes).
352
353 A typical SnpEff use case would be:
354
355 - **Input**: The inputs are predicted variants (SNPs, insertions, deletions and MNPs). The input file is usually obtained as a result of a sequencing experiment, and it is usually in variant call format (VCF).
356 - **Output**: SnpEff analyzes the input variants. It annotates the variants and calculates the effects they produce on known genes (e.g. amino acid changes).
357
358 @SNPEFF_IN_GALAXY_INFO@
359 @EXTERNAL_DOCUMENTATION@
360 ]]>
361 </help>
362 <expand macro="citations" />
363 </tool>