# HG changeset patch # User iuc # Date 1547246628 18000 # Node ID 86d4303cc3ca50d7dd95d9093b3410a7b4c0dc34 # Parent cdd90678004a78d89816f5470c3909e90f3ffbed planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gemini commit 62ed732cba355e695181924a8ed4cce49ca21c59 diff -r cdd90678004a -r 86d4303cc3ca gemini_macros.xml --- a/gemini_macros.xml Fri Dec 14 12:47:19 2018 -0500 +++ b/gemini_macros.xml Fri Jan 11 17:43:48 2019 -0500 @@ -1,15 +1,12 @@ - 0.18.1 + 0.20.1 - 181 + 200 gemini - tabix - - @@ -24,9 +21,17 @@ + + + + 10.1371/journal.pcbi.1003153 + + + + @@ -36,31 +41,36 @@ - - - - - - - + + + + + - - + + + - + - - - + + + + - - - + + + + + + + @@ -69,27 +79,23 @@ - + - + + + - - - - - - - - - - - - - + + + + @@ -103,10 +109,90 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + value.strip() + + + + + + + + + + value.strip() + + + + + + + + + + + + + + + + + value.strip() + + + not value or value.isdigit() + + + not value or value.isdigit() + + + + @@ -119,67 +205,50 @@ #end if - - #if str($filter.filter_selector) == 'yes' and $filter.filter: - --filter '${ str( $filter.filter ) }' + + #if str($report.report_selector) == 'full': + #set cols = "*" + #else: + #if $report.columns and str($report.columns) != '': + #set $cols = str($report.columns) + #else + #set $cols = '' + #end if + #if str($report.extra_cols).strip(): + #if $cols: + #set $cols = $cols + ', ' + str($report.extra_cols) + #else: + #set $cols = str($report.extra_cols) + #end if + #end if + #if not $cols: + #set $cols = "variant_id, gene" + #end if #end if - #if $report.report_selector != 'all': - --columns "${report.columns} - #if str($report.extra_cols).strip() - #echo ','+','.join(str($report.extra_cols).split()) - #end if - " + @SET_COLS@ + #if $cols != "*" + --columns '$cols' #end if - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - 10.1371/journal.pcbi.1003153 - - - - - - - - - - value is not None and value.metadata.gemini_version == "@VERSION@" - - - + = %d" % int($r.start)) + #end if + #if str($r.stop).strip(): + #silent $r_elements.append("end <= %d" % int($r.stop)) + #end if + #silent $region_elements.append("(%s)" % " AND ".join($r_elements)) + #end for + ]]> + diff -r cdd90678004a -r 86d4303cc3ca gemini_stats.xml --- a/gemini_stats.xml Fri Dec 14 12:47:19 2018 -0500 +++ b/gemini_stats.xml Fri Jan 11 17:43:48 2019 -0500 @@ -1,4 +1,4 @@ - + Compute useful variant statistics gemini_macros.xml @@ -10,41 +10,83 @@ "${ outfile }" + #if str($stats.variants.constraint).strip(): + #set $multiline_sql_expr = "select * from variants WHERE " + str($stats.variants.constraint) + #else: + #set $multiline_sql_expr = "select * from variants" + #end if + #set $cmdln_param = "--summarize" + @MULTILN_SQL_EXPR_TO_CMDLN@ + #else: + ${stats.stats_option} + #end if + '$infile' + > '$outfile' ]]> - - - - - - - - - - - - - - - - - - + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + @@ -52,21 +94,32 @@ - - + + + + + - + + + - + + + + + + - + @@ -74,31 +127,60 @@ ALT change +in your database, e.g.:: type count A->G 2 C->T 1 G->A 1 -EXAMPLE Calculate the site frequency spectrum of the variants; --sfs:: +**Transition / transversion statistics** + +This mode uses ``gemini stats`` with the ``--tstv``, ``--tstv-coding``, or +``--tstv-noncoding`` option to compute the transition/transversion ratios for +all SNPs, for SNPs in coding, or SNPs in non-coding regions, respectively. + +The result is presented in a 1x3 table listing the number of +transitions (*ts* column), transversions (*tv* column) and the ratio of the two +(*ts/tv* column), e.g.:: + + ts tv ts/tv + 126 39 3.2307 + +**Alternate allele frequency spectrum** + +Runs ``gemini stats --sfs`` to produce binned alternate allele frequency counts +in a table like:: aaf count 0.125 2 0.375 1 -EXAMPLE Compute the pair-wise genetic distance between each sample; --mds:: +**Pairwise genetic distances** + +Runs ``gemini stats --mds`` and tabulates all pairwise genetic distance for the +samples in your database. An example could look like this:: sample1 sample2 distance M10500 M10500 0.0 @@ -106,34 +188,6 @@ M10500 M10475 2.0 M10500 M10478 0.5714 -EXAMPLE Return a count of the types of genotypes per sample; --gts-by-sample:: - - sample num_hom_ref num_het num_hom_alt num_unknown total - M10475 4 1 3 1 9 - M10478 2 2 4 1 9 - - - -EXAMPLE Return the total variants per sample (sum of homozygous and heterozygous variants); --vars-by-sample:: - - sample total - M10475 4 - M10478 6 - -**Final solution** - ---summarize: - If none of these tools are exactly what you want, you can summarize the variants per sample of an arbitrary query using the –summarize flag. - -EXAMPLE If you wanted to know, for each sample, how many variants are on chromosome 1 that are also in dbSNP;--summarize "select * from variants where in_dbsnp=1 and chrom='chr1'":: - - sample total num_het num_hom_alt - M10475 1 1 0 - M128215 1 1 0 - M10478 2 2 0 - M10500 2 1 1 - - ]]> diff -r cdd90678004a -r 86d4303cc3ca repository_dependencies.xml --- a/repository_dependencies.xml Fri Dec 14 12:47:19 2018 -0500 +++ b/repository_dependencies.xml Fri Jan 11 17:43:48 2019 -0500 @@ -1,4 +1,4 @@ - + \ No newline at end of file diff -r cdd90678004a -r 86d4303cc3ca test-data/gemini_amend_input.db Binary file test-data/gemini_amend_input.db has changed diff -r cdd90678004a -r 86d4303cc3ca test-data/gemini_annotate_result.db Binary file test-data/gemini_annotate_result.db has changed diff -r cdd90678004a -r 86d4303cc3ca test-data/gemini_auto_dom_input.db Binary file test-data/gemini_auto_dom_input.db has changed diff -r cdd90678004a -r 86d4303cc3ca test-data/gemini_auto_rec_input.db Binary file test-data/gemini_auto_rec_input.db has changed diff -r cdd90678004a -r 86d4303cc3ca test-data/gemini_comphets_input.db Binary file test-data/gemini_comphets_input.db has changed diff -r cdd90678004a -r 86d4303cc3ca test-data/gemini_de_novo_input.db Binary file test-data/gemini_de_novo_input.db has changed diff -r cdd90678004a -r 86d4303cc3ca test-data/gemini_is_somatic_result.db Binary file test-data/gemini_is_somatic_result.db has changed diff -r cdd90678004a -r 86d4303cc3ca test-data/gemini_load_result1.db Binary file test-data/gemini_load_result1.db has changed diff -r cdd90678004a -r 86d4303cc3ca test-data/gemini_load_result2.db Binary file test-data/gemini_load_result2.db has changed diff -r cdd90678004a -r 86d4303cc3ca test-data/gemini_versioned_databases.loc --- a/test-data/gemini_versioned_databases.loc Fri Dec 14 12:47:19 2018 -0500 +++ b/test-data/gemini_versioned_databases.loc Fri Jan 11 17:43:48 2019 -0500 @@ -1,3 +1,3 @@ ## GEMINI versioned databases #DownloadDate dbkey DBversion Description Path -1999-01-01 hg19 181 GEMINI annotations (test snapshot) ${__HERE__}/test-cache +1999-01-01 hg19 200 GEMINI annotations (test snapshot) ${__HERE__}/test-cache diff -r cdd90678004a -r 86d4303cc3ca test-data/test-cache/gemini-config.yaml --- a/test-data/test-cache/gemini-config.yaml Fri Dec 14 12:47:19 2018 -0500 +++ b/test-data/test-cache/gemini-config.yaml Fri Jan 11 17:43:48 2019 -0500 @@ -2,12 +2,14 @@ versions: ALL.wgs.phase3_shapeit2_mvncall_integrated_v5a.20130502.sites.tidy.vcf.gz: 4 ESP6500SI.all.snps_indels.tidy.v2.vcf.gz: 2 - ExAC.r0.3.sites.vep.tidy.vcf.gz: 3 + ExAC.r0.3.sites.vep.tidy.vcf.gz: 4 GRCh37-gms-mappability.vcf.gz: 2 - clinvar_20160203.tidy.vcf.gz: 5 + clinvar_20170130.tidy.vcf.gz: 5 cosmic-v68-GRCh37.tidy.vcf.gz: 3 - dbsnp.b141.20140813.hg19.tidy.vcf.gz: 4 + dbsnp.b147.20160601.tidy.vcf.gz: 1 detailed_gene_table_v75: 2 geno2mp.variants.tidy.vcf.gz: 1 + gnomad.exomes.r2.0.1.sites.no-VEP.nohist.tidy.vcf.gz: 2 hg19.rmsk.bed.gz: 2 summary_gene_table_v75: 2 + whole_genome_SNVs.tsv.compressed.gz: 2 diff -r cdd90678004a -r 86d4303cc3ca test-data/test-cache/gemini/data/clinvar_20160203.tidy.vcf.gz Binary file test-data/test-cache/gemini/data/clinvar_20160203.tidy.vcf.gz has changed diff -r cdd90678004a -r 86d4303cc3ca test-data/test-cache/gemini/data/clinvar_20160203.tidy.vcf.gz.tbi Binary file test-data/test-cache/gemini/data/clinvar_20160203.tidy.vcf.gz.tbi has changed diff -r cdd90678004a -r 86d4303cc3ca test-data/test-cache/gemini/data/clinvar_20170130.tidy.vcf.gz Binary file test-data/test-cache/gemini/data/clinvar_20170130.tidy.vcf.gz has changed diff -r cdd90678004a -r 86d4303cc3ca test-data/test-cache/gemini/data/clinvar_20170130.tidy.vcf.gz.tbi Binary file test-data/test-cache/gemini/data/clinvar_20170130.tidy.vcf.gz.tbi has changed diff -r cdd90678004a -r 86d4303cc3ca test-data/test-cache/gemini/data/dbsnp.b141.20140813.hg19.tidy.vcf.gz Binary file test-data/test-cache/gemini/data/dbsnp.b141.20140813.hg19.tidy.vcf.gz has changed diff -r cdd90678004a -r 86d4303cc3ca test-data/test-cache/gemini/data/dbsnp.b141.20140813.hg19.tidy.vcf.gz.tbi Binary file test-data/test-cache/gemini/data/dbsnp.b141.20140813.hg19.tidy.vcf.gz.tbi has changed diff -r cdd90678004a -r 86d4303cc3ca test-data/test-cache/gemini/data/dbsnp.b147.20160601.tidy.vcf.gz Binary file test-data/test-cache/gemini/data/dbsnp.b147.20160601.tidy.vcf.gz has changed diff -r cdd90678004a -r 86d4303cc3ca test-data/test-cache/gemini/data/dbsnp.b147.20160601.tidy.vcf.gz.tbi Binary file test-data/test-cache/gemini/data/dbsnp.b147.20160601.tidy.vcf.gz.tbi has changed diff -r cdd90678004a -r 86d4303cc3ca test-data/test-cache/gemini/data/gnomad.exomes.r2.0.1.sites.no-VEP.nohist.tidy.vcf.gz Binary file test-data/test-cache/gemini/data/gnomad.exomes.r2.0.1.sites.no-VEP.nohist.tidy.vcf.gz has changed diff -r cdd90678004a -r 86d4303cc3ca test-data/test-cache/gemini/data/gnomad.exomes.r2.0.1.sites.no-VEP.nohist.tidy.vcf.gz.tbi Binary file test-data/test-cache/gemini/data/gnomad.exomes.r2.0.1.sites.no-VEP.nohist.tidy.vcf.gz.tbi has changed