annotate picard_CollectInsertSizeMetrics.xml @ 1:5f1da1eadb39 draft default tip

add symlinked macros file
author avowinkel
date Mon, 06 Jul 2015 14:48:21 -0400
parents 5166ed57b1c4
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
1 <tool name="CollectInsertSizeMetrics" id="picard_CollectInsertSizeMetrics" version="1.135">
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
2 <description>plots distribution of insert sizes</description>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
3 <macros>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
4 <import>picard_macros.xml</import>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
5 </macros>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
6 <expand macro="requirements">
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
7 <requirement type="package" version="3.1.2">R</requirement>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
8 </expand>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
9 <command>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
10 @java_options@
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
11 ##set up input files
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
12
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
13 #set $reference_fasta_filename = "localref.fa"
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
14
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
15 #if str( $reference_source.reference_source_selector ) == "history":
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
16 ln -s "${reference_source.ref_file}" "${reference_fasta_filename}" &amp;&amp;
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
17 #else:
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
18 #set $reference_fasta_filename = str( $reference_source.ref_file.fields.path )
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
19 #end if
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
20
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
21 java -jar \$JAVA_JAR_PATH/picard.jar
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
22 CollectInsertSizeMetrics
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
23 INPUT="${inputFile}"
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
24 OUTPUT="${outFile}"
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
25 HISTOGRAM_FILE="${histFile}"
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
26 DEVIATIONS="${deviations}"
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
27
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
28 #if str( $hist_width ):
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
29 HISTOGRAM_WIDTH="${hist_width}"
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
30 #end if
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
31
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
32 MINIMUM_PCT="${min_pct}"
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
33 REFERENCE_SEQUENCE="${reference_fasta_filename}"
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
34 ASSUME_SORTED="${assume_sorted}"
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
35 METRIC_ACCUMULATION_LEVEL="${metric_accumulation_level}"
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
36
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
37 VALIDATION_STRINGENCY="${validation_stringency}"
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
38 QUIET=true
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
39 VERBOSITY=ERROR
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
40
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
41 </command>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
42 <inputs>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
43 <param format="sam,bam" name="inputFile" type="data" label="Select SAM/BAM dataset or dataset collection" help="If empty, upload or import a SAM/BAM dataset."/>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
44 <conditional name="reference_source">
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
45 <param name="reference_source_selector" type="select" label="Load reference genome from">
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
46 <option value="cached">Local cache</option>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
47 <option value="history">History</option>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
48 </param>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
49 <when value="cached">
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
50 <param name="ref_file" type="select" label="Using reference genome" help="REFERENCE_SEQUENCE">
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
51 <options from_data_table="all_fasta">
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
52 </options>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
53 <validator type="no_options" message="A built-in reference genome is not available for the build associated with the selected input file"/>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
54 </param>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
55 </when>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
56 <when value="history">
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
57 <param name="ref_file" type="data" format="fasta" label="Use the following dataset as the reference sequence" help="REFERENCE_SEQUENCE; You can upload a FASTA sequence to the history and use it as reference" />
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
58 </when>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
59 </conditional>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
60 <param name="deviations" type="float" value="10.0" label="Generate mean, sd and plots by trimming the data down to MEDIAN + DEVIATIONS*MEDIAN_ABSOLUTE_DEVIATION" help="DEVIATIONS; This option is offered because insert size data typically includes enough anomalous values from chimeras and other artifacts to make the mean and SD grossly misleading regarding the real distribution. default=10.0"/>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
61 <param name="hist_width" type="integer" optional="True" label="Explicitly sets the Histogram width, overriding automatic truncation of Histogram tail" help="HISTOGRAM_WIDTH; optional"/>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
62 <param name="min_pct" type="float" value="0.05" label="When generating the Histogram, discard any data categories (out of FR, TANDEM, RF) that have fewer than this percentage of overall reads" help="MINIMUM_PCT; (Range: 0 to 1). default=0.05. "/>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
63 <param name="assume_sorted" type="boolean" label="Assume the input file is already sorted" checked="true" truevalue="true" falsevalue="false" help="ASSUME_SORTED"/>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
64 <param name="metric_accumulation_level" type="select" label="The level(s) at which to accumulate metrics" multiple="true" help="METRIC_ACCUMULATION_LEVEL">
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
65 <option value="ALL_READS" selected="True">All reads</option>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
66 <option value="SAMPLE">Sample</option>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
67 <option value="LIBRARY">Library</option>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
68 <option value="READ_GROUP">Read group</option>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
69 </param>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
70
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
71 <expand macro="VS" />
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
72
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
73 </inputs>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
74
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
75 <outputs>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
76 <data format="tabular" name="outFile"/>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
77 <data format="pdf" name="histFile"/>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
78 </outputs>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
79
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
80 <tests>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
81 <test>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
82 <param name="metric_accumulation_level" value="ALL_READS"/>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
83 <param name="deviations" value="10.0" />
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
84 <param name="hist_width" value="500" />
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
85 <param name="min_pct" value="0.05" />
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
86 <param name="assume_sorted" value="true" />
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
87 <param name="reference_source_selector" value="history" />
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
88 <param name="ref_file" value="picard_CollectInsertSizeMetrics_ref.fa" />
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
89 <param name="inputFile" value="picard_CollectInsertSizeMetrics.bam" ftype="bam" />
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
90 <output name="outFile" file="picard_CollectInsertSizeMetrics_test1.tab" ftype="tabular" lines_diff="4"/>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
91 </test>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
92 </tests>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
93
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
94 <stdio>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
95 <exit_code range="1:" level="fatal"/>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
96 </stdio>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
97
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
98 <help>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
99
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
100 .. class:: infomark
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
101
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
102 **Purpose**
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
103
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
104 Reads a SAM or BAM dataset and writes a file containing metrics about the statistical distribution of insert size (excluding duplicates) and generates a Histogram plot.
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
105
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
106 @dataset_collections@
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
107
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
108 @description@
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
109
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
110
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
111 DEVIATIONS=Double Generate mean, sd and plots by trimming the data down to MEDIAN +
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
112 DEVIATIONS*MEDIAN_ABSOLUTE_DEVIATION. This is done because insert size data typically
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
113 includes enough anomalous values from chimeras and other artifacts to make the mean and
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
114 sd grossly misleading regarding the real distribution. Default value: 10.0.
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
115
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
116 HISTOGRAM_WIDTH=Integer
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
117 W=Integer Explicitly sets the Histogram width, overriding automatic truncation of Histogram tail.
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
118 Also, when calculating mean and standard deviation, only bins &lt;= HISTOGRAM_WIDTH will be
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
119 included. Default value: not set.
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
120
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
121 MINIMUM_PCT=Float
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
122 M=Float When generating the Histogram, discard any data categories (out of FR, TANDEM, RF) that
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
123 have fewer than this percentage of overall reads. (Range: 0 to 1). Default value: 0.05.
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
124
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
125 METRIC_ACCUMULATION_LEVEL=MetricAccumulationLevel
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
126 LEVEL=MetricAccumulationLevel The level(s) at which to accumulate metrics. Possible values: {ALL_READS, SAMPLE,
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
127 LIBRARY, READ_GROUP} This option may be specified 0 or more times.
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
128
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
129 ASSUME_SORTED=Boolean
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
130 AS=Boolean If true (default), then the sort order in the header file will be ignored. Default
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
131 value: true. This option can be set to 'null' to clear the default value. Possible
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
132 values: {true, false}
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
133
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
134 @more_info@
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
135
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
136 </help>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
137 </tool>
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
138
5166ed57b1c4 Uploaded version 1.135
avowinkel
parents:
diff changeset
139