1
|
1 <tool id="rnachipintegrator_canonical_genes" name="Analyse canonical genes against 'peak' data" version="@VERSION@.0">
|
0
|
2 <description>using RnaChipIntegrator</description>
|
|
3 <macros>
|
|
4 <import>rnachipintegrator_macros.xml</import>
|
|
5 </macros>
|
|
6 <expand macro="requirements" />
|
|
7 <expand macro="version_command" />
|
1
|
8 <command interpreter="bash"><![CDATA[
|
|
9 rnachipintegrator_wrapper.sh
|
|
10 #if $peaks_in.metadata.chromCol
|
|
11 --peak_cols=${peaks_in.metadata.chromCol},${peaks_in.metadata.startCol},${peaks_in.metadata.endCol}
|
|
12 #end if
|
|
13 #if str( $cutoff ) != ""
|
|
14 --cutoff=$cutoff
|
|
15 #else
|
|
16 --cutoff=0
|
0
|
17 #end if
|
1
|
18 #if str( $number ) != ""
|
|
19 --number=$number
|
|
20 #end if
|
|
21 --promoter_region=$promoter_start,$promoter_end
|
|
22 --edge=$edge
|
|
23 --xlsx_file "$xlsx_out"
|
|
24 --output_files "$peaks_per_feature_out" "$features_per_peak_out"
|
|
25 #if $output.compact_format
|
|
26 --compact
|
|
27 #else
|
|
28 #if $output.summary
|
|
29 --summary_files "$peaks_per_feature_summary" "$features_per_peak_summary"
|
0
|
30 #end if
|
1
|
31 ${output.pad_output}
|
0
|
32 #end if
|
1
|
33 "${canonical_genes.fields.path}" "$peaks_in"
|
|
34 ]]></command>
|
0
|
35 <inputs>
|
1
|
36 <param format="tabular" name="peaks_in" type="data" label="Peaks" />
|
|
37 <param name="canonical_genes" type="select" label="Canonical genes to analyse peaks against">
|
0
|
38 <options from_data_table="rnachipintegrator_canonical_genes">
|
|
39 </options>
|
|
40 </param>
|
1
|
41 <expand macro="analysis_options" />
|
|
42 <expand macro="output_options" />
|
0
|
43 </inputs>
|
|
44 <outputs>
|
|
45 <!-- Always produce XLS output -->
|
1
|
46 <data format="xlsx" name="xlsx_out"
|
|
47 label="All RnaChipIntegrator analyses: ${canonical_genes.fields.name} vs ${peaks_in.name} (Excel spreadsheet)" />
|
|
48 <data format="tabular" name="peaks_per_feature_out"
|
|
49 label="Nearest peaks to each gene: ${canonical_genes.fields.name} vs ${peaks_in.name}" />
|
|
50 <data format="tabular" name="features_per_peak_out"
|
|
51 label="Nearest genes to each peak: ${canonical_genes.fields.name} vs ${peaks_in.name}" />
|
|
52 <data format="tabular" name="peaks_per_feature_summary"
|
|
53 label="Nearest peaks to each gene (summary): ${canonical_genes.fields.name} vs ${peaks_in.name}" >
|
|
54 <filter>output['compact_format'] is False</filter>
|
|
55 <filter>output['summary'] is True</filter>
|
0
|
56 </data>
|
1
|
57 <data format="tabular" name="features_per_peak_summary"
|
|
58 label="Nearest genes to each peak (summary): ${canonical_genes.fields.name} vs ${peaks_in.name}" >
|
|
59 <filter>output['compact_format'] is False</filter>
|
|
60 <filter>output['summary'] is True</filter>
|
0
|
61 </data>
|
|
62 </outputs>
|
|
63 <tests>
|
1
|
64 <!--
|
|
65 RnaChipIntegrator +name=mm9 +cutoff=50000 +xlsx +summary mm9_canonical_genes.tsv mm9_summits.txt
|
|
66 -->
|
0
|
67 <test>
|
1
|
68 <param name="peaks_in" value="mm9_summits.txt" ftype="tabular" />
|
0
|
69 <param name="canonical_genes" value="mm9_test" />
|
1
|
70 <param name="cutoff" value="50000" />
|
|
71 <output name="xlsx_out" file="mm9_summits.xlsx" compare="sim_size" />
|
|
72 <output name="peaks_per_feature_out" ftype="tabular"
|
|
73 file="mm9_summits_per_feature.out" />
|
|
74 <output name="features_per_peak_out" ftype="tabular"
|
|
75 file="mm9_features_per_summit.out" />
|
0
|
76 </test>
|
1
|
77 <!--
|
|
78 RnaChipIntegrator +name=mm9 +cutoff=50000 +xlsx +compact mm9_canonical_genes.tsv mm9_peaks.txt
|
|
79 -->
|
0
|
80 <test>
|
1
|
81 <param name="peaks_in" value="mm9_peaks.txt" ftype="tabular" />
|
0
|
82 <param name="canonical_genes" value="mm9_test" />
|
1
|
83 <param name="cutoff" value="50000" />
|
|
84 <output name="xlsx_out" file="mm9_peaks1.xlsx" compare="sim_size" />
|
|
85 <output name="peaks_per_feature_out" ftype="tabular"
|
|
86 file="mm9_peaks_per_feature1.out" />
|
|
87 <output name="features_per_peak_out" ftype="tabular"
|
|
88 file="mm9_features_per_peak1.out" />
|
|
89 </test>
|
|
90 <!--
|
|
91 RnaChipIntegrator +name=mm9 +cutoff=50000 +xlsx +summary +pad mm9_canonical_genes.tsv mm9_peaks.txt
|
|
92 -->
|
|
93 <test>
|
|
94 <param name="peaks_in" value="mm9_peaks.txt" ftype="tabular" />
|
|
95 <param name="canonical_genes" value="mm9_test" />
|
|
96 <param name="cutoff" value="50000" />
|
|
97 <param name="compact_format" value="false" />
|
|
98 <param name="summary" value="true" />
|
|
99 <param name="pad_output" value="true" />
|
|
100 <output name="xlsx_out" file="mm9_peaks3.xlsx" compare="sim_size" />
|
|
101 <output name="peaks_per_feature_out" ftype="tabular"
|
|
102 file="mm9_peaks_per_feature3.out" />
|
|
103 <output name="features_per_peak_out" ftype="tabular"
|
|
104 file="mm9_features_per_peak3.out" />
|
|
105 <output name="peaks_per_feature_summary" ftype="tabular"
|
|
106 file="mm9_peaks_per_feature3.summary" />
|
|
107 <output name="features_per_peak_summary" ftype="tabular"
|
|
108 file="mm9_features_per_peak3.summary" />
|
0
|
109 </test>
|
|
110 </tests>
|
|
111 <help>
|
|
112
|
|
113 .. class:: infomark
|
|
114
|
|
115 **What it does**
|
|
116
|
1
|
117 Performs integrated analyses of a set of peaks (e.g. ChIP data) against a
|
|
118 list of "canonical genes" for a specific organism and genome build,
|
|
119 identifying the nearest peaks to each canonical gene (and vice versa).
|
0
|
120
|
1
|
121 RnaChipIntegrator can be obtained from
|
0
|
122 http://fls-bioinformatics-core.github.com/RnaChipIntegrator/
|
|
123
|
|
124 -------------
|
|
125
|
|
126 .. class:: infomark
|
|
127
|
|
128 **Input**
|
|
129
|
1
|
130 The peak data must be in a tabular file with at least 3 columns of data
|
|
131 for each peak (one peak per line):
|
0
|
132
|
1
|
133 ====== ========== =================================
|
0
|
134 Column Name Description
|
1
|
135 ====== ========== =================================
|
|
136 1 chr Chromosome name
|
|
137 2 start Start position of the peak
|
|
138 3 end End position of the peak
|
|
139 ====== ========== =================================
|
0
|
140
|
|
141 -------------
|
|
142
|
|
143 .. class:: infomark
|
|
144
|
1
|
145 **Outputs**
|
|
146
|
|
147 The key outputs from the tool are two lists compromising the nearest
|
|
148 peaks for each gene, and the nearest gene for each peak (one
|
|
149 dataset for each list).
|
|
150
|
|
151 There are two formats for reporting: "compact" and "full":
|
0
|
152
|
1
|
153 * **Compact output** reports all the hits for each peak or gene on
|
|
154 a single line of output;
|
|
155 * **Full output** reports each peak/gene pair on a separate line
|
|
156 (i.e. a multi-line output format).
|
|
157
|
|
158 In "full" output mode, additional options are available:
|
|
159
|
|
160 * The output files can be "padded" with extra (empty) lines to ensure
|
|
161 that there are always the same number of lines for each peak or
|
|
162 gene, if fewer than the requested number of hits are found.
|
|
163 * "Summary" datasets can also be requested, which include just the
|
|
164 nearest peak reported for each gene (and vice versa).
|
0
|
165
|
1
|
166 In either mode these data will also be output in a single MS Excel file,
|
|
167 which contains one sheet per result set.
|
|
168
|
|
169 .. class:: warning
|
|
170
|
|
171 Using "compact" output with the number of hits limited to more than 4
|
|
172 peak/gene pairs (or with no limit at all) can result in a large number
|
|
173 of columns in the output files, which in some versions of Galaxy will
|
|
174 not be properly displayed. However the data files themselves should be
|
|
175 okay.
|
0
|
176
|
1
|
177 -------------
|
|
178
|
|
179 .. class:: informark
|
|
180
|
|
181 **More information**
|
|
182
|
|
183 It is recommended that you refer to the ``RnaChipIntegrator``
|
|
184 documentation for information on the contents of each output file:
|
|
185
|
|
186 * http://rnachipintegrator.readthedocs.org/en/latest/
|
0
|
187
|
|
188 -------------
|
|
189
|
|
190 .. class:: infomark
|
|
191
|
|
192 **Credits**
|
|
193
|
|
194 This Galaxy tool has been developed within the Bioinformatics Core Facility at the
|
|
195 University of Manchester. It runs the RnaChipIntegrator package which has also been
|
|
196 developed by this group, and is documented at
|
1
|
197 https://pypi.python.org/pypi/RnaChipIntegrator/
|
0
|
198
|
|
199 Please kindly acknowledge the Bioinformatics Core Facility if you use this tool.
|
|
200 </help>
|
1
|
201 <expand macro="citations" />
|
0
|
202 </tool>
|