Mercurial > repos > iuc > gemini_burden
diff gemini_burden.xml @ 0:e799c1a6854b draft
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit 4bbfca6f0e9cae9a8f263aad4eab7304c96358c4
author | iuc |
---|---|
date | Thu, 18 Feb 2016 08:51:59 -0500 |
parents | |
children | c70d79e0eed7 |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/gemini_burden.xml Thu Feb 18 08:51:59 2016 -0500 @@ -0,0 +1,152 @@ +<tool id="gemini_@BINARY@" name="GEMINI @BINARY@" version="@VERSION@.0"> + <description>perform sample-wise gene-level burden calculations</description> + <macros> + <import>gemini_macros.xml</import> + <token name="@BINARY@">burden</token> + </macros> + <expand macro="requirements" /> + <expand macro="stdio" /> + <expand macro="version_command" /> + <command> +<![CDATA[ + gemini @BINARY@ + --cases $cases + --controls $controls + $save_tscores + $nonsynonymous + $calpha + --permutations $permutations + #if float( str($min_aaf) ) >= 0.0: + --min-aaf $min_aaf + #end if + #if float( str($max_aaf) ) >= 0.0: + --max-aaf $max_aaf + #end if + "${ infile }" + > "${ outfile }" +]]> + + </command> + <inputs> + <expand macro="infile" /> + + <param name="cases" type="text" value="" label="Space separated list of cases for association testing" help="(--cases)"/> + <param name="controls" type="text" value="" label="Space separated list of controls for association testing" help="(--controls)"/> + + <param name="save_tscores" type="boolean" truevalue="--save_tscores" falsevalue="" checked="False" + label="Save the permuted T-scores in the output file" help="(--save_tscores)"/> + + <param name="nonsynonymous" type="boolean" truevalue="--nonsynonymous" falsevalue="" checked="False" + label="Count all nonsynonymous variants as contributing burden" help="(--nonsynonymous)"/> + <param name="calpha" type="boolean" truevalue="--calpha" falsevalue="" checked="False" + label="Run the C-alpha association test" help="(--calpha)"/> + <param name="min_aaf" type="float" value="-1" label="The min. alt. allele frequency for a variant to be included" + help="(--min-aaf)"> + <!--validator type="in_range" min="0.0"/--> + </param> + <param name="max_aaf" type="float" value="-1" label="The max. alt. allele frequency for a variant to be included" + help="(--max-aaf)"> + <!--validator type="in_range" min="0.0"/--> + </param> + + <param name="permutations" type="integer" value="1000" label="Number of permutations to run for the C-alpha test" + help="(--permutations)"> + <validator type="in_range" min="0"/> + </param> + + </inputs> + <outputs> + <data name="outfile" format="tabular" /> + </outputs> + <tests> + <test> + <param name="infile" value="gemini_burden_input.db" ftype="gemini.sqlite" /> + <param name="controls" value="M10475 M10478" /> + <param name="cases" value="M10500 M128215" /> + <param name="calpha" value="True" /> + <output name="outfile" file="gemini_burden_result.tabular" /> + </test> + </tests> + <help><![CDATA[ +**What it does** + +Burden performs sample-wise gene-level burden calculations. + +The burden tool provides a set of utilities to perform burden summaries on a per-gene, per sample basis. By default, it outputs a table of gene-wise counts of all high impact variants in coding regions for each sample: + +GEMINI burden example:: + + gene M10475 M10478 M10500 M128215 + WDR37 2 2 2 2 + CTBP2 0 0 0 1 + DHODH 1 0 0 0 + +**Setting examples** + +**--nonsynonymous** + +If you want to be a little bit less restrictive, you can include all non-synonymous variants instead. + +GEMINI output with setting --nonsynonymous:: + + gene M10475 M10478 M10500 M128215 + SYCE1 0 1 1 0 + WDR37 2 2 2 2 + CTBP2 0 0 0 1 + ASAH2C 2 1 1 0 + DHODH 1 0 0 0 + +**--calpha** + +If your database has been loaded with a PED file describing case and control samples, you can calculate the c-alpha statistic for cases vs. control. + +GEMINI output with setting --calpha:: + + gene T c Z p_value + SYCE1 -0.5 0.25 -1.0 0.841344746069 + WDR37 -1.0 1.5 -0.816496580928 0.792891910879 + CTBP2 0.0 0.0 nan nan + ASAH2C -0.5 0.75 -0.57735026919 0.718148569175 + DHODH 0.0 0.0 nan nan + +To calculate the **P-value** using a permutation test, use the --permutations option, specifying the number of permutations of the case/control labels you want to use. + +**--min-aaf and --max-aaf for --calpha** + +By default, all variants affecting a given gene will be included in the C-alpha computation. However, one may establish alternate allele frequency boundaries for the variants included using the --min-aaf and --max-aaf options. + +Used settings: + + - -calpha test.burden.db + - -min-aaf 0.0 + - -max-aaf 0.01 + - -cases + - -controls for --calpha + +If you do not have a PED file loaded, or your PED file does not follow the standard PED phenotype encoding format you can still perform the c-alpha test, but you have to specify which samples are the control samples and which are the case samples. + +Used settings: + + - -controls M10475 M10478 + - -cases M10500 M128215 + - -calpha + +Output:: + + gene T c Z p_value + SYCE1 -0.5 0.25 -1.0 0.841344746069 + WDR37 -1.0 1.5 -0.816496580928 0.792891910879 + CTBP2 0.0 0.0 nan nan + ASAH2C -0.5 0.75 -0.57735026919 0.718148569175 + DHODH 0.0 0.0 nan nan + +**--nonsynonymous --calpha** + +If you would rather consider all nonsynonymous variants for the C-alpha test rather than just the medium and high impact variants, add the --nonsynonymous flag. + + + ]]></help> + <expand macro="citations"> + <citation type="doi">10.1371/journal.pgen.1001322</citation><!-- c-alpha citation --> + </expand> +</tool>