# HG changeset patch
# User iuc
# Date 1547246628 18000
# Node ID 86d4303cc3ca50d7dd95d9093b3410a7b4c0dc34
# Parent cdd90678004a78d89816f5470c3909e90f3ffbed
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gemini commit 62ed732cba355e695181924a8ed4cce49ca21c59
diff -r cdd90678004a -r 86d4303cc3ca gemini_macros.xml
--- a/gemini_macros.xml Fri Dec 14 12:47:19 2018 -0500
+++ b/gemini_macros.xml Fri Jan 11 17:43:48 2019 -0500
@@ -1,15 +1,12 @@
- 0.18.1
+ 0.20.1
- 181
+ 200
gemini
- tabix
-
-
@@ -24,9 +21,17 @@
+
+
+
+ 10.1371/journal.pcbi.1003153
+
+
+
+
@@ -36,31 +41,36 @@
-
-
-
-
-
-
-
+
+
+
+
+
-
-
+
+
+
-
+
-
-
-
+
+
+
+
-
-
-
+
+
+
+
+
+
+
@@ -69,27 +79,23 @@
-
+
-
+
+
+
-
-
-
-
-
-
-
-
-
-
-
-
-
+
+
+
+
@@ -103,10 +109,90 @@
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ value.strip()
+
+
+
+
+
+
+
+
+
+ value.strip()
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ value.strip()
+
+
+ not value or value.isdigit()
+
+
+ not value or value.isdigit()
+
+
+
+
@@ -119,67 +205,50 @@
#end if
-
- #if str($filter.filter_selector) == 'yes' and $filter.filter:
- --filter '${ str( $filter.filter ) }'
+
+ #if str($report.report_selector) == 'full':
+ #set cols = "*"
+ #else:
+ #if $report.columns and str($report.columns) != '':
+ #set $cols = str($report.columns)
+ #else
+ #set $cols = ''
+ #end if
+ #if str($report.extra_cols).strip():
+ #if $cols:
+ #set $cols = $cols + ', ' + str($report.extra_cols)
+ #else:
+ #set $cols = str($report.extra_cols)
+ #end if
+ #end if
+ #if not $cols:
+ #set $cols = "variant_id, gene"
+ #end if
#end if
- #if $report.report_selector != 'all':
- --columns "${report.columns}
- #if str($report.extra_cols).strip()
- #echo ','+','.join(str($report.extra_cols).split())
- #end if
- "
+ @SET_COLS@
+ #if $cols != "*"
+ --columns '$cols'
#end if
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
- 10.1371/journal.pcbi.1003153
-
-
-
-
-
-
-
-
-
- value is not None and value.metadata.gemini_version == "@VERSION@"
-
-
-
+ = %d" % int($r.start))
+ #end if
+ #if str($r.stop).strip():
+ #silent $r_elements.append("end <= %d" % int($r.stop))
+ #end if
+ #silent $region_elements.append("(%s)" % " AND ".join($r_elements))
+ #end for
+ ]]>
+
diff -r cdd90678004a -r 86d4303cc3ca gemini_stats.xml
--- a/gemini_stats.xml Fri Dec 14 12:47:19 2018 -0500
+++ b/gemini_stats.xml Fri Jan 11 17:43:48 2019 -0500
@@ -1,4 +1,4 @@
-
+
Compute useful variant statistics
gemini_macros.xml
@@ -10,41 +10,83 @@
"${ outfile }"
+ #if str($stats.variants.constraint).strip():
+ #set $multiline_sql_expr = "select * from variants WHERE " + str($stats.variants.constraint)
+ #else:
+ #set $multiline_sql_expr = "select * from variants"
+ #end if
+ #set $cmdln_param = "--summarize"
+ @MULTILN_SQL_EXPR_TO_CMDLN@
+ #else:
+ ${stats.stats_option}
+ #end if
+ '$infile'
+ > '$outfile'
]]>
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
@@ -52,21 +94,32 @@
-
-
+
+
+
+
+
-
+
+
+
+
+
+
@@ -74,31 +127,60 @@
ALT change
+in your database, e.g.::
type count
A->G 2
C->T 1
G->A 1
-EXAMPLE Calculate the site frequency spectrum of the variants; --sfs::
+**Transition / transversion statistics**
+
+This mode uses ``gemini stats`` with the ``--tstv``, ``--tstv-coding``, or
+``--tstv-noncoding`` option to compute the transition/transversion ratios for
+all SNPs, for SNPs in coding, or SNPs in non-coding regions, respectively.
+
+The result is presented in a 1x3 table listing the number of
+transitions (*ts* column), transversions (*tv* column) and the ratio of the two
+(*ts/tv* column), e.g.::
+
+ ts tv ts/tv
+ 126 39 3.2307
+
+**Alternate allele frequency spectrum**
+
+Runs ``gemini stats --sfs`` to produce binned alternate allele frequency counts
+in a table like::
aaf count
0.125 2
0.375 1
-EXAMPLE Compute the pair-wise genetic distance between each sample; --mds::
+**Pairwise genetic distances**
+
+Runs ``gemini stats --mds`` and tabulates all pairwise genetic distance for the
+samples in your database. An example could look like this::
sample1 sample2 distance
M10500 M10500 0.0
@@ -106,34 +188,6 @@
M10500 M10475 2.0
M10500 M10478 0.5714
-EXAMPLE Return a count of the types of genotypes per sample; --gts-by-sample::
-
- sample num_hom_ref num_het num_hom_alt num_unknown total
- M10475 4 1 3 1 9
- M10478 2 2 4 1 9
-
-
-
-EXAMPLE Return the total variants per sample (sum of homozygous and heterozygous variants); --vars-by-sample::
-
- sample total
- M10475 4
- M10478 6
-
-**Final solution**
-
---summarize:
- If none of these tools are exactly what you want, you can summarize the variants per sample of an arbitrary query using the –summarize flag.
-
-EXAMPLE If you wanted to know, for each sample, how many variants are on chromosome 1 that are also in dbSNP;--summarize "select * from variants where in_dbsnp=1 and chrom='chr1'"::
-
- sample total num_het num_hom_alt
- M10475 1 1 0
- M128215 1 1 0
- M10478 2 2 0
- M10500 2 1 1
-
-
]]>
diff -r cdd90678004a -r 86d4303cc3ca repository_dependencies.xml
--- a/repository_dependencies.xml Fri Dec 14 12:47:19 2018 -0500
+++ b/repository_dependencies.xml Fri Jan 11 17:43:48 2019 -0500
@@ -1,4 +1,4 @@
-
+
\ No newline at end of file
diff -r cdd90678004a -r 86d4303cc3ca test-data/gemini_amend_input.db
Binary file test-data/gemini_amend_input.db has changed
diff -r cdd90678004a -r 86d4303cc3ca test-data/gemini_annotate_result.db
Binary file test-data/gemini_annotate_result.db has changed
diff -r cdd90678004a -r 86d4303cc3ca test-data/gemini_auto_dom_input.db
Binary file test-data/gemini_auto_dom_input.db has changed
diff -r cdd90678004a -r 86d4303cc3ca test-data/gemini_auto_rec_input.db
Binary file test-data/gemini_auto_rec_input.db has changed
diff -r cdd90678004a -r 86d4303cc3ca test-data/gemini_comphets_input.db
Binary file test-data/gemini_comphets_input.db has changed
diff -r cdd90678004a -r 86d4303cc3ca test-data/gemini_de_novo_input.db
Binary file test-data/gemini_de_novo_input.db has changed
diff -r cdd90678004a -r 86d4303cc3ca test-data/gemini_is_somatic_result.db
Binary file test-data/gemini_is_somatic_result.db has changed
diff -r cdd90678004a -r 86d4303cc3ca test-data/gemini_load_result1.db
Binary file test-data/gemini_load_result1.db has changed
diff -r cdd90678004a -r 86d4303cc3ca test-data/gemini_load_result2.db
Binary file test-data/gemini_load_result2.db has changed
diff -r cdd90678004a -r 86d4303cc3ca test-data/gemini_versioned_databases.loc
--- a/test-data/gemini_versioned_databases.loc Fri Dec 14 12:47:19 2018 -0500
+++ b/test-data/gemini_versioned_databases.loc Fri Jan 11 17:43:48 2019 -0500
@@ -1,3 +1,3 @@
## GEMINI versioned databases
#DownloadDate dbkey DBversion Description Path
-1999-01-01 hg19 181 GEMINI annotations (test snapshot) ${__HERE__}/test-cache
+1999-01-01 hg19 200 GEMINI annotations (test snapshot) ${__HERE__}/test-cache
diff -r cdd90678004a -r 86d4303cc3ca test-data/test-cache/gemini-config.yaml
--- a/test-data/test-cache/gemini-config.yaml Fri Dec 14 12:47:19 2018 -0500
+++ b/test-data/test-cache/gemini-config.yaml Fri Jan 11 17:43:48 2019 -0500
@@ -2,12 +2,14 @@
versions:
ALL.wgs.phase3_shapeit2_mvncall_integrated_v5a.20130502.sites.tidy.vcf.gz: 4
ESP6500SI.all.snps_indels.tidy.v2.vcf.gz: 2
- ExAC.r0.3.sites.vep.tidy.vcf.gz: 3
+ ExAC.r0.3.sites.vep.tidy.vcf.gz: 4
GRCh37-gms-mappability.vcf.gz: 2
- clinvar_20160203.tidy.vcf.gz: 5
+ clinvar_20170130.tidy.vcf.gz: 5
cosmic-v68-GRCh37.tidy.vcf.gz: 3
- dbsnp.b141.20140813.hg19.tidy.vcf.gz: 4
+ dbsnp.b147.20160601.tidy.vcf.gz: 1
detailed_gene_table_v75: 2
geno2mp.variants.tidy.vcf.gz: 1
+ gnomad.exomes.r2.0.1.sites.no-VEP.nohist.tidy.vcf.gz: 2
hg19.rmsk.bed.gz: 2
summary_gene_table_v75: 2
+ whole_genome_SNVs.tsv.compressed.gz: 2
diff -r cdd90678004a -r 86d4303cc3ca test-data/test-cache/gemini/data/clinvar_20160203.tidy.vcf.gz
Binary file test-data/test-cache/gemini/data/clinvar_20160203.tidy.vcf.gz has changed
diff -r cdd90678004a -r 86d4303cc3ca test-data/test-cache/gemini/data/clinvar_20160203.tidy.vcf.gz.tbi
Binary file test-data/test-cache/gemini/data/clinvar_20160203.tidy.vcf.gz.tbi has changed
diff -r cdd90678004a -r 86d4303cc3ca test-data/test-cache/gemini/data/clinvar_20170130.tidy.vcf.gz
Binary file test-data/test-cache/gemini/data/clinvar_20170130.tidy.vcf.gz has changed
diff -r cdd90678004a -r 86d4303cc3ca test-data/test-cache/gemini/data/clinvar_20170130.tidy.vcf.gz.tbi
Binary file test-data/test-cache/gemini/data/clinvar_20170130.tidy.vcf.gz.tbi has changed
diff -r cdd90678004a -r 86d4303cc3ca test-data/test-cache/gemini/data/dbsnp.b141.20140813.hg19.tidy.vcf.gz
Binary file test-data/test-cache/gemini/data/dbsnp.b141.20140813.hg19.tidy.vcf.gz has changed
diff -r cdd90678004a -r 86d4303cc3ca test-data/test-cache/gemini/data/dbsnp.b141.20140813.hg19.tidy.vcf.gz.tbi
Binary file test-data/test-cache/gemini/data/dbsnp.b141.20140813.hg19.tidy.vcf.gz.tbi has changed
diff -r cdd90678004a -r 86d4303cc3ca test-data/test-cache/gemini/data/dbsnp.b147.20160601.tidy.vcf.gz
Binary file test-data/test-cache/gemini/data/dbsnp.b147.20160601.tidy.vcf.gz has changed
diff -r cdd90678004a -r 86d4303cc3ca test-data/test-cache/gemini/data/dbsnp.b147.20160601.tidy.vcf.gz.tbi
Binary file test-data/test-cache/gemini/data/dbsnp.b147.20160601.tidy.vcf.gz.tbi has changed
diff -r cdd90678004a -r 86d4303cc3ca test-data/test-cache/gemini/data/gnomad.exomes.r2.0.1.sites.no-VEP.nohist.tidy.vcf.gz
Binary file test-data/test-cache/gemini/data/gnomad.exomes.r2.0.1.sites.no-VEP.nohist.tidy.vcf.gz has changed
diff -r cdd90678004a -r 86d4303cc3ca test-data/test-cache/gemini/data/gnomad.exomes.r2.0.1.sites.no-VEP.nohist.tidy.vcf.gz.tbi
Binary file test-data/test-cache/gemini/data/gnomad.exomes.r2.0.1.sites.no-VEP.nohist.tidy.vcf.gz.tbi has changed