annotate inner_distance.xml @ 31:cc5eaa9376d8

Lance's updates
author nilesh
date Wed, 02 Oct 2013 02:20:04 -0400
parents adc934fb9a76
children 580ee0c4bc4e
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
31
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
1 <tool id="inner_distance" name="Inner Distance" version="1.1">
20
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
2 <description>calculate the inner distance (or insert size) between two paired RNA reads</description>
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
3 <requirements>
31
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
4 <requirement type="package" version="2.11.0">R</requirement>
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
5 <requirement type="package" version="1.7.1">numpy</requirement>
20
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
6 <requirement type="package" version="2.3.7">rseqc</requirement>
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
7 </requirements>
31
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
8 <command> inner_distance.py -i $input -o output -r $refgene
20
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
9
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
10 #if $bounds.hasLowerBound
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
11 -l $bounds.lowerBound
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
12 #end if
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
13
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
14 #if $bounds2.hasUpperBound
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
15 -u $bounds2.upperBound
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
16 #end if
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
17
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
18 #if $steps.step
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
19 -s $steps.stepSize
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
20 #end if
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
21 </command>
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
22 <inputs>
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
23 <param name="input" type="data" format="bam,sam" label="input bam/sam file" />
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
24 <param name="refgene" type="data" format="bed" label="reference gene model" />
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
25 <conditional name="bounds">
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
26 <param name="hasLowerBound" type="boolean" label="Specify lower bound" value="false"/>
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
27 <when value="true">
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
28 <param name="lowerBound" type="integer" value="-250" label="Estimated Lower Bound (bp, default=-250)" />
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
29 </when>
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
30 </conditional>
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
31 <conditional name="bounds2">
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
32 <param name="hasUpperBound" type="boolean" label="Specify upper bound" value="false" />
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
33 <when value="true">
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
34 <param name="upperBound" type="integer" value="250" label="Estimated Upper Bound (bp, default=250)" />
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
35 </when>
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
36 </conditional>
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
37 <conditional name="steps">
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
38 <param name="step" type="boolean" label="Specify step size" value="false" />
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
39 <when value="true">
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
40 <param name="stepSize" type="integer" value="5" label="Step size (bp, default=5)" />
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
41 </when>
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
42 </conditional>
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
43 </inputs>
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
44 <outputs>
31
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
45 <data format="txt" name="outputtxt" from_work_dir="output.inner_distance.txt" label="${tool.name} on ${on_string} (Text)"/>
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
46 <data format="txt" name="outputfreqtxt" from_work_dir="output.inner_distance_freq.txt" label="${tool.name} on ${on_string} (Freq Text)" />
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
47 <data format="pdf" name="outputpdf" from_work_dir="output.inner_distance_plot.pdf" label="${tool.name} on ${on_string} (PDF)" />
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
48 <data format="r" name="outputr" from_work_dir="output.inner_distance_plot.r" label="${tool.name} on ${on_string} (R Script)" />
20
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
49 </outputs>
31
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
50 <stdio> <!-- Job failure detection: an exit code in range "1:" is fatal; stdout and stderr (source="both") are scanned for "Error"/"error". -->
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
51 <exit_code range="1:" level="fatal" description="An error occurred during execution, see stderr and stdout for more information" />
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
52 <regex match="[Ee]rror" source="both" description="An error occurred during execution, see stderr and stdout for more information" />
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
53 </stdio>
20
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
54 <help>
31
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
55 inner_distance.py
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
56 +++++++++++++++++
20
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
57
31
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
58 This module is used to calculate the inner distance (or insert size) between two paired RNA
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
59 reads. The distance is the mRNA length between two paired fragments. We first determine the
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
60 genomic (DNA) size between two paired reads: D_size = read2_start - read1_end, then
20
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
61
31
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
62 * if two paired reads map to the same exon: inner distance = D_size
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
63 * if two paired reads map to different exons: inner distance = D_size - intron_size
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
64 * if two paired reads map to a non-exonic region (such as an intron or intergenic region): inner distance = D_size
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
65 * The inner_distance might be a negative value if the two fragments overlap.
20
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
66
31
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
67 NOTE: Not all read pairs were used to estimate the inner distance distribution. Low-quality,
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
68 PCR-duplicate, and multi-mapped reads were skipped.
20
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
69
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
70 Inputs
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
71 ++++++++++++++
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
72
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
73 Input BAM/SAM file
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
74 Alignment file in BAM/SAM format.
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
75
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
76 Reference gene model
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
77 Gene model in BED format.
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
78
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
79 Estimated Upper/Lower Bounds (defaults=250 and -250)
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
80 Estimated upper/lower bounds of inner distance (bp).
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
81
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
82 Step size (default=5)
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
83 Step size of histogram
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
84
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
85
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
86 Output
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
87 ++++++++++++++
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
88
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
89 1. output.inner_distance.txt:
31
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
90 - first column is read ID
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
91 - second column is the inner distance. It can be negative if the PE reads overlap or there is a mapping error (e.g. Read1_start &lt; Read2_start, while Read1_end >> Read2_end due to spliced mapping of read1)
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
92 - third column indicates how paired reads were mapped: PE_within_same_exon, PE_within_diff_exon, PE_reads_overlap
20
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
93 2. output.inner_distance_freq.txt:
31
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
94 - inner distance starts
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
95 - inner distance ends
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
96 - number of read pairs
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
97 - note that the first 2 columns define a left-side half-open interval
20
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
98 3. output.inner_distance_plot.r: R script to generate histogram
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
99 4. output.inner_distance_plot.pdf: histogram plot
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
100
31
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
101 .. image:: http://rseqc.sourceforge.net/_images/inner_distance.png
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
102 :height: 600 px
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
103 :width: 600 px
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
104 :scale: 80 %
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
105
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
106
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
107 -----
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
108
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
109 About RSeQC
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
110 +++++++++++
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
111
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
112 The RSeQC_ package provides a number of useful modules that can comprehensively evaluate high throughput sequence data especially RNA-seq data. "Basic modules" quickly inspect sequence quality, nucleotide composition bias, PCR bias and GC bias, while "RNA-seq specific modules" investigate sequencing saturation status of both splicing junction detection and expression estimation, mapped reads clipping profile, mapped reads distribution, coverage uniformity over gene body, reproducibility, strand specificity and splice junction annotation.
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
113
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
114 The RSeQC package is licensed under the GNU GPL v3 license.
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
115
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
116 .. image:: http://rseqc.sourceforge.net/_static/logo.png
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
117
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
118 .. _RSeQC: http://rseqc.sourceforge.net/
cc5eaa9376d8 Lance's updates
nilesh
parents: 20
diff changeset
119
20
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
120
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
121 </help>
adc934fb9a76 Uploaded
nilesh
parents:
diff changeset
122 </tool>