4
|
1 <tool id="kggseq_variant_selection" name="Variant selection with KGGSeq" version="1.4">
|
0
|
2 <description></description>
|
|
3 <requirements>
|
4
|
4 <requirement type="package" version="1.0_0_20160412">kggseq</requirement>
|
0
|
5 </requirements>
|
|
6 <command>
|
|
7 java -jar \$KGGSEQ_JAR_PATH/kggseq.jar
|
|
8 ## Environmental settings
|
|
9 --buildver hg19
|
|
10 --resource \$KGGSEQ_JAR_PATH/resources
|
|
11 --no-lib-check
|
|
12 --no-resource-check
|
|
13 --no-progress-check
|
|
14 --out results
|
|
15 --o-vcf
|
4
|
16 --no-gz
|
0
|
17
|
|
18 --vcf-file $inputFile
|
|
19 --ped-file $pedFile
|
|
20 --db-gene $db_gene
|
|
21 $composite_subject_id
|
|
22
|
1
|
23 ## Variant and genotype filters
|
|
24 #if str($variant_genotype_filters.variant_genotype_filters_select) == "yes"
|
3
|
25 $variant_genotype_filters.pass_variant_only
|
1
|
26 --seq-qual $variant_genotype_filters.seq_qual
|
|
27 --seq-mq $variant_genotype_filters.seq_mq
|
|
28 --seq-sb $variant_genotype_filters.seq_sb
|
|
29 --seq-fs $variant_genotype_filters.seq_fs
|
|
30 --min-heta $variant_genotype_filters.min_heta
|
|
31 --min-homa $variant_genotype_filters.min_homa
|
|
32 --min-hetu $variant_genotype_filters.min_hetu
|
|
33 --min-homu $variant_genotype_filters.min_homu
|
|
34 --min-obsa $variant_genotype_filters.min_obsa
|
|
35 --min-obsu $variant_genotype_filters.min_obsu
|
|
36 --min-obs $variant_genotype_filters.min_obs
|
|
37 #if str($variant_genotype_filters.hwe_control)
|
|
38 --hwe-control $variant_genotype_filters.hwe_control
|
0
|
39 #end if
|
1
|
40 #if str($variant_genotype_filters.hwe_case)
|
|
41 --hwe-case $variant_genotype_filters.hwe_case
|
|
42 #end if
|
|
43 #if str($variant_genotype_filters.hwe_all)
|
|
44 --hwe-all $variant_genotype_filters.hwe_all
|
0
|
45 #end if
|
1
|
46 --gty-qual $variant_genotype_filters.gty_qual
|
|
47 --gty-dp $variant_genotype_filters.gty_dp
|
|
48 --gty-sec-pl $variant_genotype_filters.gty_sec_pl
|
|
49 --gty-af-ref $variant_genotype_filters.gty_af_ref
|
|
50 --gty-af-het $variant_genotype_filters.gty_af_het
|
|
51 --gty-af-alt $variant_genotype_filters.gty_af_alt
|
0
|
52 #else
|
1
|
53 --no-qc
|
0
|
54 #end if
|
|
55
|
|
56 ## Genetic inheritance
|
|
57 #if str($genetic_filters.genetic_filters_select) == "yes"
|
|
58 #if str($genetic_filters.genetic_model.genetic_model_select) == "yes"
|
|
59 #if $genetic_filters.genetic_model.custom_genetic_params
|
|
60 --genotype-filter $genetic_filters.genetic_model.custom_genetic_params
|
|
61 #end if
|
|
62 #else
|
|
63 $genetic_filters.genetic_model.suggested_genetic_params
|
|
64 #end if
|
|
65 #end if
|
|
66
|
1
|
67 ## Homozygosity - IBS - IBD filters
|
|
68 #if str($hom_ibs_ibd_filters.hom_ibs_ibd_filters_select) == "yes"
|
|
69 #if str($hom_ibs_ibd_filters.homozygosity_case_filter)
|
|
70 --homozygosity-case-filter $hom_ibs_ibd_filters.homozygosity_case_filter
|
|
71 #end if
|
|
72 #if str($hom_ibs_ibd_filters.ibs_case_filter)
|
|
73 --ibs-case-filter $hom_ibs_ibd_filters.ibs_case_filter
|
|
74 #end if
|
|
75 #if str($hom_ibs_ibd_filters.ibd_annot) != 'None'
|
|
76 --ibd-annot $hom_ibs_ibd_filters.ibd_annot
|
|
77 #end if
|
|
78 #end if
|
|
79
|
0
|
80 ## Gene feature filters
|
|
81 #if str($gene_feature_filters.gene_feature_filters_select) == "yes" and $gene_feature_filters.gene_features
|
|
82 --gene-feature-in $gene_feature_filters.gene_features
|
|
83 --splicing $gene_feature_filters.splicing
|
|
84 --neargene $gene_feature_filters.neargene
|
|
85 #end if
|
|
86
|
|
87 ## Common variants filters
|
|
88 #if str($allele_freq_filters.allele_freq_filters_select) == "yes"
|
|
89 #if $allele_freq_filters.allele_freq_db
|
|
90 --db-filter $allele_freq_filters.allele_freq_db
|
|
91 #end if
|
|
92 --rare-allele-freq $allele_freq_filters.rare_allele_freq
|
|
93 #end if
|
|
94
|
|
95 ## Genomic regions filters
|
|
96 #if str($genomic_region_filters.genomic_region_filters_select) == "yes"
|
|
97 $genomic_region_filters.ignore_indel_or_snv
|
|
98 #if $genomic_region_filters.regions_in
|
|
99 --regions-in "$genomic_region_filters.regions_in"
|
|
100 #end if
|
|
101 #if $genomic_region_filters.regions_out
|
|
102 --regions-out "$genomic_region_filters.regions_out"
|
|
103 #end if
|
|
104 #if $genomic_region_filters.genes_in
|
|
105 --genes-in "$genomic_region_filters.genes_in"
|
|
106 #end if
|
|
107 #if $genomic_region_filters.genes_out
|
|
108 --genes-out "$genomic_region_filters.genes_out"
|
|
109 #end if
|
|
110 $genomic_region_filters.superdup
|
|
111 #if str($genomic_region_filters.gene_var_filter)
|
|
112 --gene-var-filter $genomic_region_filters.gene_var_filter
|
|
113 #end if
|
|
114 #end if
|
|
115
|
|
116 ## Predicted impact filters
|
|
117 #if str($impact_filters.impact_filters_select) == "yes"
|
|
118 --db-score dbnsfp
|
|
119 $impact_filters.filter_nondisease_variant
|
|
120 $impact_filters.mendel_causing
|
|
121 #end if
|
|
122
|
|
123 ## Add annotations
|
|
124 #if str($add_annotations.add_annotations_select) == "yes"
|
1
|
125 #if str($add_annotations.o_flanking_seq)
|
|
126 --o-flanking-seq $add_annotations.o_flanking_seq
|
|
127 #end if
|
0
|
128 $add_annotations.genome_annotation
|
|
129 $add_annotations.omim_annotation
|
4
|
130 $add_annotations.cosmic_annotation
|
|
131 $add_annotations.scsnv_annotation
|
|
132 $add_annotations.dgv_cnv_annotation
|
|
133 $add_annotations.superdup_annotation
|
|
134 $add_annotations.mouse_pheno_annotation
|
|
135 $add_annotations.zebrafish_pheno_annotation
|
|
136 $add_annotations.ddd_annotation
|
|
137 $add_annotations.patho_gene_predict_annotation
|
0
|
138 #if $add_annotations.pubmed_mining_gene
|
4
|
139 --phenotype-term "$add_annotations.pubmed_mining_gene" --pubmed-mining
|
0
|
140 #end if
|
|
141 #if str($add_annotations.shared_genes.shared_genes_select) == "yes"
|
|
142 --ppi-annot string
|
|
143 --candi-file $add_annotations.shared_genes.candi_file
|
|
144 --ppi-depth $add_annotations.shared_genes.ppi_depth
|
|
145 --pathway-annot $add_annotations.shared_genes.pathway_annot
|
|
146 #end if
|
|
147 #end if
|
|
148 > $logFile
|
|
149 </command>
|
|
150 <inputs>
|
|
151 <param name="inputFile" type="data" format="vcf" label="VCF Variant file (--vcf-file)" help="Coordinates must refer to hg19" />
|
|
152 <param name="pedFile" type="data" format="tabular" label="Pedigree (--ped-file)" />
|
1
|
153 <param name="composite_subject_id" type="boolean" truevalue="--composite-subject-id" falsevalue="" checked="false" label="Composite subject ID (--composite-subject-id)" />
|
0
|
154 <param name="db_gene" type="select" display="checkboxes" multiple="true" label="Database(s) to annotate and filter variants (--db-gene)">
|
|
155 <option value="refgene" selected="true">refgene: The RefGene database compiled by UCSC from hg19 refGene. Note: RefSeq has NO mitochondria gene definition</option>
|
1
|
156 <option value="gencode">gencode: The GENCODE gene sets. Note: GENCODE contains similar number of coding genes but more transcripts than RefGene. It HAS the mitochondria gene definition</option>
|
0
|
157 <option value="knowngene">knowngene: The UCSC knonwGene datasase compiled by UCSC from hg19 knownGene</option>
|
1
|
158 <option value="ensembl">ensembl: The Ensembl gene datasase compiled by UCSC from hg19 ensGene</option>
|
0
|
159 <validator type="no_options" message="Select at least one database" />
|
|
160 </param>
|
|
161
|
1
|
162 <!-- Variant and genotype quality control -->
|
|
163 <conditional name="variant_genotype_filters">
|
|
164 <param name="variant_genotype_filters_select" type="select" label="Specify variant and genotype quality filters?">
|
0
|
165 <option value="yes">Yes</option>
|
|
166 <option value="no" selected="true">No</option>
|
|
167 </param>
|
|
168 <when value="yes">
|
3
|
169 <param name="pass_variant_only" type="boolean" truevalue="--vcf-filter-in PASS" falsevalue="" checked="true" label="Don't include filtered loci (--vcf-filter-in PASS)" help="Keep only variants with FILTER equal to PASS" />
|
0
|
170 <param name="seq_qual" type="integer" value="50" label="Minimum overall Phred-scaled sequencing quality score for the variant (--seq-qual)" />
|
|
171 <param name="seq_mq" type="integer" value="20" label="Minimum overall Phred-scaled mapping quality score for the variant (--seq-mq)" />
|
|
172 <param name="seq_sb" type="float" value="-10" label="Maximal overall strand bias score for the variant (--seq-sb)" />
|
|
173 <param name="seq_fs" type="integer" value="60" label="Maximal overall strand bias Phred-scaled p-value (using Fisher's exact test) for the variant (--seq-fs)" />
|
1
|
174 <param name="min_heta" type="integer" value="0" label="Minimal observed number of heterozygote genotypes in cases (the affected) (--min-heta)" />
|
|
175 <param name="min_homa" type="integer" value="0" label="Minimal observed number of alternate homozygote genotypes in cases (the affected) (--min-homa)" />
|
|
176 <param name="min_hetu" type="integer" value="0" label="Minimal observed number of heterozygote genotypes in controls (the unaffected) (--min-hetu)" />
|
|
177 <param name="min_homu" type="integer" value="0" label="Minimal observed number of alternate homozygote genotypes in controls (the unaffected) (--min-homu)" />
|
|
178 <param name="min_obsa" type="integer" value="0" label="Minimal observed number of non-missing genotypes in cases (the affected) (--min-obsa)" />
|
|
179 <param name="min_obsu" type="integer" value="0" label="Minimal observed number of non-missing genotypes in controls (the unaffected) (--min-obsu)" />
|
|
180 <param name="min_obs" type="integer" value="1" label="Minimal observed number of non-missing genotypes in all samples (--min-obs)" />
|
0
|
181 <param name="hwe_control" type="float" value="" optional="true" label="Exclude variants in controls with the Hardy-Weinberg test p-value <= this value (--hwe-control)" />
|
|
182 <param name="hwe_case" type="float" value="" optional="true" label="Exclude variants in cases with the Hardy-Weinberg test p-value <= this value (--hwe-case)" />
|
|
183 <param name="hwe_all" type="float" value="" optional="true" label="Exclude variants in all subjects with the Hardy-Weinberg test p-value <= this value (--hwe-all)" />
|
|
184 <param name="gty_qual" type="integer" value="10" label="Minimum Phred-scaled genotyping quality (--gty-qual)" />
|
|
185 <param name="gty_dp" type="integer" value="4" label="Minimal read depth per genotype (--gty-dp)" />
|
|
186 <param name="gty_sec_pl" type="integer" value="20" label="Minimal value for second smallest normalized Phred-scaled genotype quality (--gty-sec-pl)" />
|
|
187 <param name="gty_af_ref" type="float" value="0.05" label="Maximal fraction of reads carrying alternative allele at a reference allele homozygous genotype (--gty-af-ref)" />
|
|
188 <param name="gty_af_het" type="float" value="0.25" label="Minimal fraction of reads carrying alternative allele at a heterozygous genotype (--gty-af-het)" />
|
|
189 <param name="gty_af_alt" type="float" value="0.5" label="Minimal fraction of reads carrying alternative allele at a alternative allele homozygous genotype (--gty-af-alt)" />
|
|
190 </when>
|
|
191 <when value="no" />
|
|
192 </conditional>
|
|
193
|
|
194 <!-- Genetic inheritance -->
|
|
195 <conditional name="genetic_filters">
|
|
196 <param name="genetic_filters_select" type="select" label="Specify genetic inheritance?">
|
|
197 <option value="yes">Yes</option>
|
|
198 <option value="no" selected="true">No</option>
|
|
199 </param>
|
|
200 <when value="yes">
|
|
201 <conditional name="genetic_model">
|
|
202 <param name="genetic_model_select" type="select" label="Specify advanced settings for genetic inheritance?">
|
|
203 <option value="yes">Yes</option>
|
|
204 <option value="no" selected="true">No</option>
|
|
205 </param>
|
|
206 <!-- Custom genetic filters -->
|
|
207 <when value="yes">
|
|
208 <param name="custom_genetic_params" type="select" display="checkboxes" multiple="true" label="Select genetic inheritance (advanced) (--genotype-filter)" help="Multiple filtration codes have logical OR relationship">
|
|
209 <option value="1">Exclude variants at which affected subjects have heterozygous genotypes (1)</option>
|
|
210 <option value="2">Exclude variants at which both affected and unaffected subjects have the same homozygous genotypes (2)</option>
|
|
211 <option value="3">Exclude variants at which affected subjects have reference homozygous genotypes (3)</option>
|
|
212 <option value="4">Exclude variants at which both affected and unaffected subjects have the same heterozygous genotypes (4)</option>
|
|
213 <option value="5">Exclude variants at which affected subjects have alternative homozygous genotypes (5)</option>
|
|
214 <option value="6">Exclude variants at which affected family members have NO shared alleles (6)</option>
|
|
215 <option value="7">ONLY include variants at which an offspring has one or two non-inherited alleles (7)</option>
|
|
216 </param>
|
|
217 </when>
|
|
218 <!-- Suggested genetic filters -->
|
|
219 <when value="no">
|
|
220 <param name="suggested_genetic_params" type="select" display="radio" label="Select genetic inheritance">
|
|
221 <option value="--genotype-filter 1,2,3">Recessive (--genotype-filter 1,2,3)</option>
|
|
222 <option value="--double-hit-gene-trio-filter" selected="true">Recessive and compound-heterozygous (--double-hit-gene-trio-filter)</option>
|
|
223 <option value="--double-hit-gene-phased-filter">Recessive and compound-heterozygous with phased samples (--double-hit-gene-phased-filter)</option>
|
|
224 <option value="--genotype-filter 2,3,4,5">Dominant (--genotype-filter 2,3,4,5)</option>
|
|
225 <option value="--genotype-filter 7">De novo mutation (--genotype-filter 7)</option>
|
|
226 <option value="--unique-gene-filter">Only genes on which EVERY affected subject has at least one case-unique alternative allele, but these alleles may be from different variants (--unique-gene-filter)</option>
|
|
227 </param>
|
|
228 </when>
|
|
229 </conditional>
|
|
230 </when>
|
|
231 <when value="no" />
|
|
232 </conditional>
|
|
233
|
1
|
234 <!-- Homozygosity filtering -->
|
|
235 <conditional name="hom_ibs_ibd_filters">
|
|
236 <param name="hom_ibs_ibd_filters_select" type="select" label="Specify homozygosity filters?">
|
|
237 <option value="yes">Yes</option>
|
|
238 <option value="no" selected="true">No</option>
|
|
239 </param>
|
|
240 <when value="yes">
|
|
241 <param name="homozygosity_case_filter" type="integer" value="" optional="true" label="Filter by Runs of Homozygosity (ROH) (--homozygosity-case-filter)" help="Minimal length (in kb) of consecutive homozygous genotype for each interesting variant" />
|
|
242 <param name="ibs_case_filter" type="integer" value="" optional="true" label="Filter by Identical by State (IBS) (--ibs-case-filter)" help="Minimal length (in kb) of the region in which there is at least one allele identical among all cases" />
|
|
243 <param name="ibd_annot" type="data" format="txt,tabular,bed" optional="true" label="Add Identical by Descent (IBD) annotation (--ibd-annot)" help="File with IBD or significant linkage regions. Variants within these regions will be highlighted. Note: title line CHR START END is needed" />
|
|
244 </when>
|
|
245 <when value="no" />
|
|
246 </conditional>
|
|
247
|
0
|
248 <!-- Gene feature filtering -->
|
|
249 <conditional name="gene_feature_filters">
|
|
250 <param name="gene_feature_filters_select" type="select" label="Specify gene feature filters?">
|
|
251 <option value="yes">Yes</option>
|
|
252 <option value="no" selected="true">No</option>
|
|
253 </param>
|
|
254 <when value="yes">
|
|
255 <param name="gene_features" type="select" display="checkboxes" multiple="true" label="Select gene features (--gene-feature-in)" help="Variants falling outside the selected regions will be excluded">
|
|
256 <option value="0" selected="true">Frame-shift</option>
|
|
257 <option value="1" selected="true">Loss of amino acids</option>
|
3
|
258 <option value="2" selected="true">Loss of start codon</option>
|
|
259 <option value="3" selected="true">Loss of stop codon (TAG, TAA, TGA)</option>
|
|
260 <option value="4" selected="true">Gain of stop codon (TAG, TAA, TGA)</option>
|
0
|
261 <option value="5" selected="true">Splicing</option>
|
3
|
262 <option value="6" selected="true">Missense</option>
|
|
263 <option value="7">Synonymous</option>
|
|
264 <option value="8">Exonic</option>
|
|
265 <option value="9">5-UTR</option>
|
|
266 <option value="10">3-UTR</option>
|
|
267 <option value="11">Intronic</option>
|
|
268 <option value="12">Upstream of transcription start site</option>
|
|
269 <option value="13">Downstream of transcription end site</option>
|
|
270 <option value="14">ncRNA</option>
|
|
271 <option value="15">Intergenic</option>
|
|
272 <option value="16">Monomorphic</option>
|
|
273 <option value="17">Unknown</option>
|
0
|
274 </param>
|
|
275 <param name="splicing" type="integer" value="2" label="Window size in base-pair around the splicing junction to flag the variant as splicing (--splicing)" />
|
1
|
276 <param name="neargene" type="integer" value="1000" label="Size in base-pair of region upstream and downstream (--neargene)" />
|
0
|
277 </when>
|
|
278 <when value="no" />
|
|
279 </conditional>
|
|
280
|
|
281 <!-- Allele frequency filtering -->
|
|
282 <conditional name="allele_freq_filters">
|
1
|
283 <param name="allele_freq_filters_select" type="select" label="Specify filters by allele frequency?">
|
0
|
284 <option value="yes">Yes</option>
|
|
285 <option value="no" selected="true">No</option>
|
|
286 </param>
|
|
287 <when value="yes">
|
4
|
288 <param name="allele_freq_db" type="select" display="checkboxes" multiple="true" label="Select databases for allelic frequency filtering (--db-filter)">
|
|
289 <option value="1kgeur201305">1KG EUR 201305: 495 subjects in the EUR panel of 1000 Genomes Project release in 2013 May (around 24.0 million sequence variants)</option>
|
|
290 <option value="1kgeas201305">1KG EAS 201305: 496 subjects in the EAS panel of 1000 Genomes Project release in 2013 May (around 23.5 million sequence variants)</option>
|
|
291 <option value="1kgafr201305">1KG AFR 201305: 645 subjects in the AFR panel of 1000 Genomes Project release in 2013 May (around 41.7 million sequence variants)</option>
|
|
292 <option value="1kgsas201305">1KG SAS 201305: 485 subjects in the SAS panel of 1000 Genomes Project release in 2013 May (around 26.7 million sequence variants)</option>
|
|
293 <option value="1kgamr201305">1KG AMR 201305: 346 subjects in the AMR panel of 1000 Genomes Project release in 2013 May (around 28.2 million sequence variants)</option>
|
1
|
294 <option value="1kg201305" selected="true">1KG 201305: 1000 Genomes Project 2013 May release</option>
|
|
295 <option value="1kg201204">1KG 201204: 1000 Genomes Project 2012 April release</option>
|
|
296 <option value="1kgafr201204">1KG 201204 AFR: 1000 Genomes Project 2012 April release - African</option>
|
|
297 <option value="1kgeur201204">1KG 201204 EUR: 1000 Genomes Project 2012 April release - European</option>
|
|
298 <option value="1kgamr201204">1KG 201204 AMR: 1000 Genomes Project 2012 April release - Mixed American</option>
|
|
299 <option value="1kgasn201204">1KG 201204 ASN: 1000 Genomes Project 2012 April release - Asian</option>
|
|
300 <option value="ESP6500AA" selected="true">ESP6500AA: African American dataset from NHLBI GO Exome Sequencing Project (ESP6500)</option>
|
|
301 <option value="ESP6500EA" selected="true">ESP6500EA: European American dataset from NHLBI GO Exome Sequencing Project (ESP6500)</option>
|
|
302 <option value="dbsnp141" selected="true">dnSNP 141</option>
|
|
303 <option value="dbsnp138">dbSNP 138</option>
|
|
304 <option value="dbsnp138nf">dbSNP 138nf: dbSNP version 138 without the flagged SNPs by UCSC. Flagged SNPs include SNPs clinically associated by dbSNP, mapped to a single location in the reference genome assembly, and not known to have a minor allele frequency of at least 1%</option>
|
|
305 <option value="dbsnp137">dbSNP 137</option>
|
|
306 <option value="dbsnp135">dbSNP 135</option>
|
|
307 <option value="exac">Exome Aggregation Consortium (ExAC): Variants from 61,486 unrelated individuals sequenced as part of various disease-specific and population genetic studies</option>
|
0
|
308 </param>
|
|
309 <param name="rare_allele_freq" type="float" value="0.01" label="Minor allele frequency (MAF) for selecting rare variants (--rare-allele-freq)" help="Set to >1 to only annotate MAF, without filtering" />
|
|
310 </when>
|
|
311 <when value="no" />
|
|
312 </conditional>
|
|
313
|
|
314 <!-- Variant type, region and gene filtering -->
|
|
315 <conditional name="genomic_region_filters">
|
|
316 <param name="genomic_region_filters_select" type="select" label="Specify variant type, region and gene filtering?">
|
|
317 <option value="yes">Yes</option>
|
|
318 <option value="no" selected="true">No</option>
|
|
319 </param>
|
|
320 <when value="yes">
|
|
321 <param name="ignore_indel_or_snv" type="select" label="Ignore indels or SNVs?">
|
|
322 <option value="" selected="true">No</option>
|
|
323 <option value="--ignore-indel">Ignore insertion and deletion sequence variants (indels) (--ignore-indel)</option>
|
|
324 <option value="--ignore-snv">Ignore single nucleotide variants (SNVs) (--ignore-snv)</option>
|
|
325 </param>
|
|
326 <param name="regions_in" type="text" label="Keep only variants within some genomic regions (--regions-in)" help="A comma-separated list of genomic regions, e.g. chrX,chrY:1-1000" />
|
|
327 <param name="regions_out" type="text" label="Ignore variants within some genomic regions (--regions-out)" help="A comma-separated list of genomic regions, e.g. chrX,chrY:1-1000" />
|
|
328 <param name="genes_in" type="text" label="Keep only variants within some genes (--genes-in)" help="A comma-separated list of gene symbols, e.g. TCF4,CNNM2,ANK3" />
|
|
329 <param name="genes_out" type="text" label="Ignore variants within some genes (--genes-out)" help="A comma-separated list of gene symbols, e.g. TCF4,CNNM2,ANK3" />
|
|
330 <param name="superdup" type="select" label="Annotate or filter out variants in super duplicate regions?" help="As defined in genomicSuperDups dataset from UCSC">
|
|
331 <option value="" selected="true">No</option>
|
|
332 <option value="--superdup-annot">Annotate variants in super duplicate regions (--superdup-annot)</option>
|
|
333 <option value="--superdup-filter">Filter out variants in super duplicate regions (--superdup-filter)</option>
|
|
334 </param>
|
|
335 <param name="gene_var_filter" type="integer" value="" optional="true" label="Filter out genes with at least this number of putative pathogenic variants (--gene-var-filter)" help="As a rule of thumb, it is safe to set a cutoff of 4 or more. " />
|
|
336 </when>
|
|
337 <when value="no" />
|
|
338 </conditional>
|
|
339
|
|
340 <!-- Predicted impact filtering -->
|
|
341 <conditional name="impact_filters">
|
|
342 <param name="impact_filters_select" type="select" label="Specify functional impact filters?">
|
|
343 <option value="yes">Yes</option>
|
|
344 <option value="no" selected="true">No</option>
|
|
345 </param>
|
|
346 <when value="yes">
|
1
|
347 <param name="filter_nondisease_variant" type="boolean" truevalue="--filter-nondisease-variant" falsevalue="" checked="false" label="Filter out variants predicted to be non-disease causal (--filter-nondisease-variant)" />
|
0
|
348 <param name="mendel_causing" type="boolean" truevalue="--mendel-causing-predict all" falsevalue="" checked="true" label="Predict Mendelian disease-causing variants by logistic regression model (--mendel-causing-predict)" />
|
|
349 </when>
|
|
350 <when value="no" />
|
|
351 </conditional>
|
|
352
|
|
353 <!-- Annotations -->
|
|
354 <conditional name="add_annotations">
|
|
355 <param name="add_annotations_select" type="select" label="Add annotations?">
|
|
356 <option value="yes">Yes</option>
|
|
357 <option value="no" selected="true">No</option>
|
|
358 </param>
|
|
359 <when value="yes">
|
2
|
360 <param name="o_flanking_seq" type="integer" value="" optional="true" label="Size in bp of flanking sequence to extract (--o-flanking-seq)" />
|
0
|
361 <param name="genome_annotation" type="boolean" truevalue="--genome-annot" falsevalue="" checked="true" label="Add genomic functional annotations (presudogenes, TFBS, enhancer, UniProt) (--genome-annot)" />
|
|
362 <param name="omim_annotation" type="boolean" truevalue="--omim-annot" falsevalue="" checked="true" label="Add OMIM annotation (--omim-annot)" />
|
4
|
363 <param name="cosmic_annotation" type="boolean" truevalue="--cosmic-annot" falsevalue="" checked="true" label="Add COSMIC annotation (--cosmic-annot)" />
|
|
364 <param name="scsnv_annotation" type="boolean" truevalue="--scsnv-annot" falsevalue="" checked="true" label="Potential of altering splicing (--scsnv-annot)" />
|
|
365 <param name="dgv_cnv_annotation" type="boolean" truevalue="--dgv-cnv-annot" falsevalue="" checked="true" label="Map a variant against known structure variation (--dgv-cnv-annot)" />
|
|
366 <param name="superdup_annotation" type="boolean" truevalue="--superdup-annot" falsevalue="" checked="true" label="Mark the variants in the super duplicate regions (--superdup-annot)" />
|
|
367 <param name="mouse_pheno_annotation" type="boolean" truevalue="--mouse-pheno" falsevalue="" checked="true" label="Annotate the genes with known mouse phenotypes as reference (--mouse-pheno)" />
|
|
368 <param name="zebrafish_pheno_annotation" type="boolean" truevalue="--zebrafish-pheno" falsevalue="" checked="true" label="Annotate the genes with known zebrafish phenotypes as reference (--zebrafish-pheno)" />
|
|
369 <param name="ddd_annotation" type="boolean" truevalue="--ddd-annot" falsevalue="" checked="true" label="Annotate by disease names in Deciphering Developmental Disorders (DDD) study (--ddd-annot)" />
|
|
370 <param name="patho_gene_predict_annotation" type="boolean" truevalue="--patho-gene-predict" falsevalue="" checked="true" label="Predict genes’ pathogenicity (--patho-gene-predict)" />
|
0
|
371 <param name="pubmed_mining_gene" type="text" label="Text mining in PubMed: search term(s) of interest (e.g. disease name)" help="A comma-separated list of search terms, each composed by plus-separated words, e.g. spinocerebellar+ataxia,other+search+term. If empty, no search will be performed" />
|
4
|
372 <!-- Shared protein-protein interactions and pathways -->
|
0
|
373 <conditional name="shared_genes">
|
|
374 <param name="shared_genes_select" type="select" label="Add annotations for shared interactions/pathways?">
|
|
375 <option value="yes">Yes</option>
|
|
376 <option value="no" selected="true">No</option>
|
|
377 </param>
|
|
378 <when value="yes">
|
|
379 <param name="candi_file" type="data" format="txt,tabular" label="List of candidate genes of interest (--candi-file)" />
|
|
380 <param name="ppi_depth" type="integer" value="1" label="Maximum distance of a protein-protein interaction (PPI) between candidate genes and genes containing the variants (--ppi-depth)" />
|
|
381 <param name="pathway_annot" type="select" label="Select databases for the identification of shared pathways between candidate genes and genes containing the variants (--pathway-annot)" help="Gene sets are extracted from MSigDB">
|
|
382 <option value="cura" selected="true">Curated gene sets (4850)</option>
|
|
383 <option value="cano">Canonical pathways (1452)</option>
|
|
384 <option value="onco">Oncogenic signatures (189)</option>
|
|
385 <option value="cmop">Computational gene sets (858)</option>
|
|
386 <option value="onto">Gene Ontology gene sets (1454)</option>
|
|
387 </param>
|
|
388 </when>
|
|
389 <when value="no" />
|
|
390 </conditional>
|
|
391 </when>
|
|
392 <when value="no" />
|
|
393 </conditional>
|
|
394 </inputs>
|
|
395 <outputs>
|
|
396 <data name="outVcf" format="vcf" label="${tool.name} on ${on_string}: VCF" from_work_dir="results.flt.vcf" />
|
|
397 <data name="outTabular" format="tabular" label="${tool.name} on ${on_string}: tabular" from_work_dir="results.flt.txt" />
|
|
398 <data name="outDoubleHitTriosGty" format="tabular" label="${tool.name} on ${on_string}: double-hit genotypes" from_work_dir="results.doublehit.gene.trios.flt.gty.txt">
|
|
399 <filter>genetic_filters['genetic_filters_select'] == "yes" and genetic_filters['genetic_model']['genetic_model_select'] == "no" and genetic_filters['genetic_model']['suggested_genetic_params'] == "--double-hit-gene-trio-filter"</filter>
|
|
400 </data>
|
|
401 <data name="outDoubleHitTriosCount" format="tabular" label="${tool.name} on ${on_string}: double-hit counts" from_work_dir="results.doublehit.gene.trios.flt.count.txt">
|
|
402 <filter>genetic_filters['genetic_filters_select'] == "yes" and genetic_filters['genetic_model']['genetic_model_select'] == "no" and genetic_filters['genetic_model']['suggested_genetic_params'] == "--double-hit-gene-trio-filter"</filter>
|
|
403 </data>
|
|
404 <data name="outDoubleHitPhasedGty" format="tabular" label="${tool.name} on ${on_string}: double-hit phased genotypes" from_work_dir="results.doublehit.gene.phased.flt.gty.txt">
|
|
405 <filter>genetic_filters['genetic_filters_select'] == "yes" and genetic_filters['genetic_model']['genetic_model_select'] == "no" and genetic_filters['genetic_model']['suggested_genetic_params'] == "--double-hit-gene-phased-filter"</filter>
|
|
406 </data>
|
|
407 <data name="outDoubleHitPhasedCount" format="tabular" label="${tool.name} on ${on_string}: double-hit phased counts" from_work_dir="results.doublehit.gene.phased.flt.count.txt">
|
|
408 <filter>genetic_filters['genetic_filters_select'] == "yes" and genetic_filters['genetic_model']['genetic_model_select'] == "no" and genetic_filters['genetic_model']['suggested_genetic_params'] == "--double-hit-gene-phased-filter"</filter>
|
|
409 </data>
|
|
410 <data name="logFile" format="txt" label="${tool.name} on ${on_string}: log" />
|
|
411 </outputs>
|
|
412 <help>
|
|
413 **What it does**
|
|
414
|
|
415 This tool uses `KGGSeq`_ to filter and prioritize genetic variants from sequencing data.
|
|
416
|
|
417 **License and citation**
|
|
418
|
|
419 This Galaxy tool is Copyright © 2013-2014 `CRS4 Srl.`_ and is released under the `MIT license`_.
|
|
420
|
|
421 .. _CRS4 Srl.: http://www.crs4.it/
|
|
422 .. _MIT license: http://opensource.org/licenses/MIT
|
|
423
|
|
424 You can use this tool only if you agree to the license terms of: `KGGSeq`_.
|
|
425
|
|
426 .. _KGGSeq: http://statgenpro.psychiatry.hku.hk/limx/kggseq/
|
|
427
|
|
428 If you use this tool, please cite:
|
|
429
|
|
430 - |Cuccuru2014|_
|
|
431 - |Li2012|_
|
|
432 - |Li2013|_.
|
|
433
|
|
434 .. |Cuccuru2014| replace:: Cuccuru, G., Orsini, M., Pinna, A., Sbardellati, A., Soranzo, N., Travaglione, A., Uva, P., Zanetti, G., Fotia, G. (2014) Orione, a web-based framework for NGS analysis in microbiology. *Bioinformatics* 30(13), 1928-1929
|
|
435 .. _Cuccuru2014: http://bioinformatics.oxfordjournals.org/content/30/13/1928
|
|
436 .. |Li2012| replace:: Li, M.-X., *et al.* (2012) A comprehensive framework for prioritizing variants in exome sequencing studies of Mendelian diseases. *Nucleic Acids Res.* 40(7), e53
|
|
437 .. _Li2012: http://nar.oxfordjournals.org/content/40/7/e53
|
|
438 .. |Li2013| replace:: Li, M.-X., *et al.* (2013) Predicting Mendelian Disease-Causing Non-Synonymous Single Nucleotide Variants in Exome Sequencing Studies. *PLoS Genet.* 9(1), e1003143
|
|
439 .. _Li2013: http://www.plosgenetics.org/article/info:doi/10.1371/journal.pgen.1003143
|
|
440 </help>
|
|
441 </tool>
|