Mercurial > repos > jjohnson > filter_bed_on_splice_junctions
diff filter_bed_on_splice_junctions.xml @ 0:915e5c5e02e6 draft default tip
Uploaded
author | jjohnson |
---|---|
date | Wed, 05 Feb 2014 08:18:49 -0500 |
parents | |
children |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/filter_bed_on_splice_junctions.xml Wed Feb 05 08:18:49 2014 -0500 @@ -0,0 +1,61 @@ +<?xml version="1.0"?> +<tool id="filter_bed_on_splice_junctions" name="Filter BED on splice junctions" version="0.0.1"> + <description>that are not in a reference bed file</description> + <command interpreter="python">filter_bed_on_splice_junctions.py --input "$input_bed" + --guided_junctions "$guided_junctions" + #if $leading_bp: + --leading_bp $leading_bp + #end if + #if $trailing_bp: + --trailing_bp $trailing_bp + #end if + --novel_junctions "$novel_junctions" + </command> + <inputs> + <param name="input_bed" type="data" format="bed" label="BED file" + help="e.g. tophat junctions.bed run without GTF option or no-novel-junctions"/> + <param name="guided_junctions" type="data" format="bed" optional="true" label="reference bed file" + help="e.g. tophat junctions.bed run with GTF option and no-novel-junctions"/> + <param name="leading_bp" type="integer" value="" min="0" optional="true" label="Extend the start position" + help="The number of base pairs to extend the start of the exon before the junction position"/> + <param name="trailing_bp" type="integer" value="" min="0" optional="true" label="Extend the end position" + help="The number of base pairs to extend the end of the exon after the junction position"/> + </inputs> + <stdio> + <exit_code range="1:" level="fatal" description="Error" /> + </stdio> + <outputs> + <data name="novel_junctions" metadata_source="input_bed" format="bed"/> + </outputs> + <tests> + <test> + <param name="input_bed" value="novel_splice_junctions.bed" ftype="bed" dbkey="hg19"/> + <param name="guided_junctions" value="gtf_splice_junctions.bed" ftype="bed" dbkey="hg19"/> + <param name="leading_bp" value="0"/> + <param name="trailing_bp" value="0"/> + <output name="novel_junctions" file="filtered_novel_splice_junctions.bed"/> + </test> + <test> + <param name="input_bed" value="novel_splice_junctions.bed" ftype="bed" dbkey="hg19"/> + <param name="guided_junctions" value="gtf_splice_junctions.bed" ftype="bed" dbkey="hg19"/> + <param name="leading_bp" value="10"/> + <param name="trailing_bp" value="10"/> + <output name="novel_junctions" file="extended_novel_splice_junctions.bed"/> + </test> + </tests> + <help> +**Filter BED on splice junctions** + +Filter out lines of a BED file that have junctions that are in in the reference bed file of known junctions. +The start position of the exon preceding the junction and the end position of the exon after the junction can be extended. +This is to compensate for alignments that may not include enough of the exons surrounding the junctions. + +A typical application would be to run tophat twice, +once with the --GTF and --no-novel-juncs options for well known splice junctions, +then a second time without those options to also include novel splice junctions. + +This application would filter out the well splice known junctions +from the run intended to find all splice junctions including novel ones. + + </help> +</tool>