Mercurial > repos > nilesh > tabix
changeset 1:eb790a7f5e7a draft
Uploaded
author | nilesh |
---|---|
date | Wed, 10 Jul 2013 15:06:23 -0400 |
parents | 6478acbb2c36 |
children | 438b5c8d736c |
files | tabix.xml |
diffstat | 1 files changed, 89 insertions(+), 0 deletions(-) [+] |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/tabix.xml Wed Jul 10 15:06:23 2013 -0400 @@ -0,0 +1,89 @@ +<tool id="tabix" name="tabix" version="0.0.1"> + <description>Generic indexer for TAB-delimited genome position files.</description> + <requirements> + <requirements type="package" version= "0.2.6">tabix</requirements> + </requirements> + <command> + tabix + #if str($position) == "no" + -0 + #end if + + #if str($options.extension) == "tabular" + #if str($options.columnseq) != "" + -s $options.columnseq + #end if + + #if str($options.columnstart) != "" + -b $options.columnstart + #end if + + #if str($options.columnend) != "" + -e $options.columnend + #end if + + #if str($options.skiplines) != "" + -S $options.skiplines + #end if + + #if str($options.skipchar) != "" + -c $options.skipchar + #end if + #else + -p + #end if + + $input $region + + </command> + <inputs> + <param name="input" type="data" label="Input file" format="gff,bed,sam,vcf,tabular"> + </param> + <param name="region" type="text" optional="true" label="Regions (seperate with spaces)"> </param> + <conditional name="optional"> + <param name= "extension" type="select" value= "tabular" label= "Input Extension"> + <option value="tabular">tabular</option> + <option value="gff">gff</option> + <option value="bed">bed</option> + <option value="sam">sam</option> + <option value="vcf">vcf</option> + </param> + <when value="tabular"> + <param name="columnseq" type="integer" optional= "true" label="Column of sequence name" /> + <param name="columnstart" type="integer" optional= "true" label="Column of start chromosomal position" /> + <param name="columnend" type="integer" optional= "true" label="Column of end chromosomal position" /> + <param name="skiplines" type="integer" optional= "true" label="Skip first INT lines" /> + <param name="skipchar" type="text" optional= "true" label="Skip lines started with CHAR" /> + <param name="position" type= "select" value= "yes" label="1-based? (if not, 0-based)"> + <option value= "yes">yes</option> + <option value= "no">no</option> + </param> + </when> + </conditional> + </inputs> + + <outputs> + <data format="tabular" name="output" /> + </outputs> + + <help> +**What it does:** + +Tabix indexes a TAB-delimited genome position file in.tab.bgz and creates an index file in.tab.bgz.tbi when region is absent from the command-line. The input data file must be position sorted and compressed by bgzip which has a gzip(1) like interface. After indexing, tabix is able to quickly retrieve data lines overlapping regions specified in the format "chr:beginPos-endPos". Fast data retrieval also works over network if URI is given as a file name and in this case the index file will be downloaded if it is not present locally. + +**Citation:** + +Tabix was written by Heng Li. The BGZF library was originally implemented by Bob Handsaker and modified by Heng Li for remote file access and in-memory caching. + +http://samtools.sourceforge.net/tabix.shtml + +**Example:** + +(grep ^"#" in.gff; grep -v ^"#" in.gff | sort -k1,1 -k4,4n) | bgzip > sorted.gff.gz; + +tabix -p gff sorted.gff.gz; + +tabix sorted.gff.gz chr1:10,000,000-20,000,000; + + </help> +</tool>