comparison junction_saturation.xml @ 51:09846d5169fa draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/rseqc commit 37fb1988971807c6a072e1afd98eeea02329ee83
author iuc
date Tue, 14 Mar 2017 10:23:21 -0400
parents f242ee103277
children 5873cd7afb67
comparison
equal deleted inserted replaced
50:f242ee103277 51:09846d5169fa
1 <tool id="rseqc_junction_saturation" name="Junction Saturation" version="2.4galaxy1"> 1 <tool id="rseqc_junction_saturation" name="Junction Saturation" version="@WRAPPER_VERSION@">
2 <description>detects splice junctions from each subset and compares them to reference gene model</description> 2 <description>detects splice junctions from each subset and compares them to reference gene model</description>
3 3
4 <macros> 4 <macros>
5 <import>rseqc_macros.xml</import> 5 <import>rseqc_macros.xml</import>
6 </macros> 6 </macros>
7 7
8 <requirements> 8 <expand macro="requirements" />
9 <expand macro="requirement_package_r" />
10 <expand macro="requirement_package_numpy" />
11 <expand macro="requirement_package_rseqc" />
12 </requirements>
13 9
14 <expand macro="stdio" /> 10 <expand macro="stdio" />
15 11
16 <version_command><![CDATA[junction_saturation.py --version]]></version_command> 12 <version_command><![CDATA[junction_saturation.py --version]]></version_command>
17 13
18 <command><![CDATA[ 14 <command><![CDATA[
19 junction_saturation.py 15 junction_saturation.py
20 --input-file $input 16 --input-file '${input}'
21 --refgene $refgene 17 --refgene '${refgene}'
22 --out-prefix output 18 --out-prefix output
23 --min-intron $min_intron 19 --min-intron ${min_intron}
24 --min-coverage $min_coverage 20 --min-coverage ${min_coverage}
25 --mapq $mapq 21 --mapq ${mapq}
26 #if $percentiles.specifyPercentiles 22 #if str($percentiles_type.percentiles_type_selector) == "specify":
27 --percentile-floor $percentiles.lowBound 23 --percentile-floor ${percentiles_type.lowBound}
28 --percentile-ceiling $percentiles.upBound 24 --percentile-ceiling ${percentiles_type.upBound}
29 --percentile-step $percentiles.percentileStep 25 --percentile-step ${percentiles_type.percentileStep}
30 #end if 26 #end if
31 ]]> 27 ]]>
32 </command> 28 </command>
33 29
34 <inputs> 30 <inputs>
35 <param name="input" type="data" format="bam,sam" label="input bam/sam file" help="(--input-file)"/> 31 <expand macro="bam_sam_param" />
36 <param name="refgene" type="data" format="bed" label="reference gene model" help="(--refgene)"/> 32 <expand macro="refgene_param" />
37 <param name="min_intron" type="integer" value="50" label="Minimum intron length (bp, default=50)" help="(--min-intron)" /> 33 <expand macro="min_intron_param" />
38 <param name="min_coverage" type="integer" label="Minimum number of supporting reads to call a junction (default=1)" value="1" help="(--min-coverage)" /> 34 <param name="min_coverage" type="integer" label="Minimum number of supporting reads to call a junction (default=1)" value="1" help="(--min-coverage)" />
39 <param name="mapq" type="integer" label="Minimum mapping quality (default=30)" help="Minimum phred scale mapping quality to consider a read 'uniquely mapped' (--mapq)" value="30" /> 35 <expand macro="mapq_param" />
40 <conditional name="percentiles"> 36 <conditional name="percentiles_type">
41 <param name="specifyPercentiles" type="boolean" label="Specify sampling bounds and frequency" value="false"/> 37 <param name="percentiles_type_selector" type="select" label="Sampling bounds and frequency">
42 <when value="true"> 38 <option value="default" selected="true">Default sampling bounds and frequency</option>
39 <option value="specify">Specify sampling bounds and frequency</option>
40 </param>
41 <when value="specify">
43 <param name="lowBound" type="integer" value="5" label="Lower Bound Sampling Frequency (bp, default=5)" help="(--percentile-floor)"> 42 <param name="lowBound" type="integer" value="5" label="Lower Bound Sampling Frequency (bp, default=5)" help="(--percentile-floor)">
44 <validator type="in_range" min="0" max="100" /> 43 <validator type="in_range" min="0" max="100" />
45 </param> 44 </param>
46 <param name="upBound" type="integer" value="100" label="Upper Bound Sampling Frequency (bp, default=100)" help="(--percentile-ceiling)"> 45 <param name="upBound" type="integer" value="100" label="Upper Bound Sampling Frequency (bp, default=100)" help="(--percentile-ceiling)">
47 <validator type="in_range" min="0" max="100" /> 46 <validator type="in_range" min="0" max="100" />
48 </param> 47 </param>
49 <param name="percentileStep" type="integer" value="5" label="Sampling increment (default=5)" help="(--percentile-step)"> 48 <param name="percentileStep" type="integer" value="5" label="Sampling increment (default=5)" help="(--percentile-step)">
50 <validator type="in_range" min="0" max="100" /> 49 <validator type="in_range" min="0" max="100" />
51 </param> 50 </param>
52 </when> 51 </when>
53 <when value="false"/> 52 <when value="default"/>
54 </conditional> 53 </conditional>
54 <expand macro="rscript_output_param" />
55 </inputs> 55 </inputs>
56 56
57 <outputs> 57 <outputs>
58 <data format="txt" name="outputr" from_work_dir="output.junctionSaturation_plot.r" label="${tool.name} on ${on_string} (R Script)"/> 58 <expand macro="pdf_output_data" filename="output.junctionSaturation_plot.pdf" />
59 <data format="pdf" name="outputpdf" from_work_dir="output.junctionSaturation_plot.pdf" label="${tool.name} on ${on_string} (PDF)"/> 59 <expand macro="rscript_output_data" filename="output.junctionSaturation_plot.r" />
60 </outputs> 60 </outputs>
61 61
62 <tests> 62 <tests>
63 <test> 63 <test>
64 <param name="input" value="pairend_strandspecific_51mer_hg19_chr1_1-100000.bam"/> 64 <param name="input" value="pairend_strandspecific_51mer_hg19_chr1_1-100000.bam" />
65 <param name="refgene" value="hg19_RefSeq_chr1_1-100000.bed"/> 65 <param name="refgene" value="hg19_RefSeq_chr1_1-100000.bed" />
66 <output name="outputr" file="output.junctionSaturation_plot.r"/> 66 <param name="rscript_output" value="true" />
67 <output name="outputr" file="output.junctionSaturation_plot.r" compare="sim_size">
68 <assert_contents>
69 <has_line line="pdf('output.junctionSaturation_plot.pdf')" />
70 <has_line line="x=c(5,10,15,20,25,30,35,40,45,50,55,60,65,70,75,80,85,90,95,100)" />
71 </assert_contents>
72 </output>
73 <output name="outputpdf" file="output.junctionSaturation_plot.pdf" compare="sim_size" />
67 </test> 74 </test>
68 </tests> 75 </tests>
69 76
70 <help><![CDATA[ 77 <help><![CDATA[
71 junction_saturation.py 78 junction_saturation.py
103 ++++++++++++++ 110 ++++++++++++++
104 111
105 1. output.junctionSaturation_plot.r: R script to generate plot 112 1. output.junctionSaturation_plot.r: R script to generate plot
106 2. output.junctionSaturation_plot.pdf 113 2. output.junctionSaturation_plot.pdf
107 114
108 .. image:: http://rseqc.sourceforge.net/_images/junction_saturation.png 115 .. image:: $PATH_TO_IMAGES/junction_saturation.png
109 :height: 600 px 116 :height: 600 px
110 :width: 600 px 117 :width: 600 px
111 :scale: 80 % 118 :scale: 80 %
112 119
113 In this example, current sequencing depth is almost saturated for "known junction" (red line) detection because the number of "known junction" reaches a plateau. In other words, nearly all "known junctions" (expressed in this particular tissue) have already been detected, and continue sequencing will not detect additional "known junction" and will only increase junction coverage (i.e. junction covered by more reads). While current sequencing depth is not saturated for novel junctions (green). 120 In this example, current sequencing depth is almost saturated for "known junction" (red line) detection because the number of "known junction" reaches a plateau. In other words, nearly all "known junctions" (expressed in this particular tissue) have already been detected, and continue sequencing will not detect additional "known junction" and will only increase junction coverage (i.e. junction covered by more reads). While current sequencing depth is not saturated for novel junctions (green).
114 121
122 @ABOUT@
115 123
116 -----
117
118 About RSeQC
119 +++++++++++
120
121 The RSeQC_ package provides a number of useful modules that can comprehensively evaluate high throughput sequence data especially RNA-seq data. "Basic modules" quickly inspect sequence quality, nucleotide composition bias, PCR bias and GC bias, while "RNA-seq specific modules" investigate sequencing saturation status of both splicing junction detection and expression estimation, mapped reads clipping profile, mapped reads distribution, coverage uniformity over gene body, reproducibility, strand specificity and splice junction annotation.
122
123 The RSeQC package is licensed under the GNU GPL v3 license.
124
125 .. image:: http://rseqc.sourceforge.net/_static/logo.png
126
127 .. _RSeQC: http://rseqc.sourceforge.net/
128 ]]> 124 ]]>
129 </help> 125 </help>
130 126
131 <expand macro="citations" /> 127 <expand macro="citations" />
132 128