Mercurial > repos > pjbriggs > rnachipintegrator
annotate rnachipintegrator_canonical_genes.xml @ 6:466c68008537 draft default tip
Updated for RnaChipIntegrator 3.0.0.
author | pjbriggs |
---|---|
date | Wed, 20 Mar 2024 09:11:04 +0000 |
parents | b695071de766 |
children |
rev | line source |
---|---|
4
b695071de766
Uploaded version 1.0.3.1 (switch to conda dependency resolution)
pjbriggs
parents:
1
diff
changeset
|
1 <tool id="rnachipintegrator_canonical_genes" name="Analyse canonical genes against 'peak' data" version="@VERSION@"> |
0 | 2 <description>using RnaChipIntegrator</description> |
3 <macros> | |
4 <import>rnachipintegrator_macros.xml</import> | |
5 </macros> | |
6 <expand macro="requirements" /> | |
7 <expand macro="version_command" /> | |
6 | 8 <command detect_errors="aggressive"><![CDATA[ |
9 bash $__tool_directory__/rnachipintegrator_wrapper.sh | |
1 | 10 #if $peaks_in.metadata.chromCol |
11 --peak_cols=${peaks_in.metadata.chromCol},${peaks_in.metadata.startCol},${peaks_in.metadata.endCol} | |
12 #end if | |
13 #if str( $cutoff ) != "" | |
14 --cutoff=$cutoff | |
15 #else | |
16 --cutoff=0 | |
0 | 17 #end if |
1 | 18 #if str( $number ) != "" |
19 --number=$number | |
20 #end if | |
21 --promoter_region=$promoter_start,$promoter_end | |
22 --edge=$edge | |
23 --xlsx_file "$xlsx_out" | |
24 --output_files "$peaks_per_feature_out" "$features_per_peak_out" | |
25 #if $output.compact_format | |
26 --compact | |
27 #else | |
28 #if $output.summary | |
29 --summary_files "$peaks_per_feature_summary" "$features_per_peak_summary" | |
0 | 30 #end if |
1 | 31 ${output.pad_output} |
0 | 32 #end if |
1 | 33 "${canonical_genes.fields.path}" "$peaks_in" |
34 ]]></command> | |
0 | 35 <inputs> |
1 | 36 <param format="tabular" name="peaks_in" type="data" label="Peaks" /> |
37 <param name="canonical_genes" type="select" label="Canonical genes to analyse peaks against"> | |
0 | 38 <options from_data_table="rnachipintegrator_canonical_genes"> |
39 </options> | |
40 </param> | |
1 | 41 <expand macro="analysis_options" /> |
42 <expand macro="output_options" /> | |
0 | 43 </inputs> |
44 <outputs> | |
45 <!-- Always produce XLS output --> | |
1 | 46 <data format="xlsx" name="xlsx_out" |
47 label="All RnaChipIntegrator analyses: ${canonical_genes.fields.name} vs ${peaks_in.name} (Excel spreadsheet)" /> | |
48 <data format="tabular" name="peaks_per_feature_out" | |
49 label="Nearest peaks to each gene: ${canonical_genes.fields.name} vs ${peaks_in.name}" /> | |
50 <data format="tabular" name="features_per_peak_out" | |
51 label="Nearest genes to each peak: ${canonical_genes.fields.name} vs ${peaks_in.name}" /> | |
52 <data format="tabular" name="peaks_per_feature_summary" | |
53 label="Nearest peaks to each gene (summary): ${canonical_genes.fields.name} vs ${peaks_in.name}" > | |
54 <filter>output['compact_format'] is False</filter> | |
55 <filter>output['summary'] is True</filter> | |
0 | 56 </data> |
1 | 57 <data format="tabular" name="features_per_peak_summary" |
58 label="Nearest genes to each peak (summary): ${canonical_genes.fields.name} vs ${peaks_in.name}" > | |
59 <filter>output['compact_format'] is False</filter> | |
60 <filter>output['summary'] is True</filter> | |
0 | 61 </data> |
62 </outputs> | |
63 <tests> | |
1 | 64 <!-- |
65 RnaChipIntegrator +name=mm9 +cutoff=50000 +xlsx +summary mm9_canonical_genes.tsv mm9_summits.txt | |
66 --> | |
0 | 67 <test> |
1 | 68 <param name="peaks_in" value="mm9_summits.txt" ftype="tabular" /> |
0 | 69 <param name="canonical_genes" value="mm9_test" /> |
1 | 70 <param name="cutoff" value="50000" /> |
71 <output name="xlsx_out" file="mm9_summits.xlsx" compare="sim_size" /> | |
72 <output name="peaks_per_feature_out" ftype="tabular" | |
73 file="mm9_summits_per_feature.out" /> | |
74 <output name="features_per_peak_out" ftype="tabular" | |
75 file="mm9_features_per_summit.out" /> | |
0 | 76 </test> |
1 | 77 <!-- |
78 RnaChipIntegrator +name=mm9 +cutoff=50000 +xlsx +compact mm9_canonical_genes.tsv mm9_peaks.txt | |
79 --> | |
0 | 80 <test> |
1 | 81 <param name="peaks_in" value="mm9_peaks.txt" ftype="tabular" /> |
0 | 82 <param name="canonical_genes" value="mm9_test" /> |
1 | 83 <param name="cutoff" value="50000" /> |
84 <output name="xlsx_out" file="mm9_peaks1.xlsx" compare="sim_size" /> | |
85 <output name="peaks_per_feature_out" ftype="tabular" | |
86 file="mm9_peaks_per_feature1.out" /> | |
87 <output name="features_per_peak_out" ftype="tabular" | |
88 file="mm9_features_per_peak1.out" /> | |
89 </test> | |
90 <!-- | |
91 RnaChipIntegrator +name=mm9 +cutoff=50000 +xlsx +summary +pad mm9_canonical_genes.tsv mm9_peaks.txt | |
92 --> | |
93 <test> | |
94 <param name="peaks_in" value="mm9_peaks.txt" ftype="tabular" /> | |
95 <param name="canonical_genes" value="mm9_test" /> | |
96 <param name="cutoff" value="50000" /> | |
97 <param name="compact_format" value="false" /> | |
98 <param name="summary" value="true" /> | |
99 <param name="pad_output" value="true" /> | |
100 <output name="xlsx_out" file="mm9_peaks3.xlsx" compare="sim_size" /> | |
101 <output name="peaks_per_feature_out" ftype="tabular" | |
102 file="mm9_peaks_per_feature3.out" /> | |
103 <output name="features_per_peak_out" ftype="tabular" | |
104 file="mm9_features_per_peak3.out" /> | |
105 <output name="peaks_per_feature_summary" ftype="tabular" | |
106 file="mm9_peaks_per_feature3.summary" /> | |
107 <output name="features_per_peak_summary" ftype="tabular" | |
108 file="mm9_features_per_peak3.summary" /> | |
0 | 109 </test> |
110 </tests> | |
111 <help> | |
112 | |
113 .. class:: infomark | |
114 | |
115 **What it does** | |
116 | |
1 | 117 Performs integrated analyses of a set of peaks (e.g. ChIP data) against a |
118 list of "canonical genes" for a specific organism and genome build, | |
119 identifying the nearest peaks to each canonical gene (and vice versa). | |
0 | 120 |
1 | 121 RnaChipIntegrator can be obtained from |
0 | 122 http://fls-bioinformatics-core.github.com/RnaChipIntegrator/ |
123 | |
124 ------------- | |
125 | |
126 .. class:: infomark | |
127 | |
128 **Input** | |
129 | |
1 | 130 The peak data must be in a tabular file with at least 3 columns of data |
131 for each peak (one peak per line): | |
0 | 132 |
1 | 133 ====== ========== ================================= |
0 | 134 Column Name Description |
1 | 135 ====== ========== ================================= |
136 1 chr Chromosome name | |
137 2 start Start position of the peak | |
138 3 end End position of the peak | |
139 ====== ========== ================================= | |
0 | 140 |
141 ------------- | |
142 | |
143 .. class:: infomark | |
144 | |
1 | 145 **Outputs** |
146 | |
147 The key outputs from the tool are two lists compromising the nearest | |
148 peaks for each gene, and the nearest gene for each peak (one | |
149 dataset for each list). | |
150 | |
151 There are two formats for reporting: "compact" and "full": | |
0 | 152 |
1 | 153 * **Compact output** reports all the hits for each peak or gene on |
154 a single line of output; | |
155 * **Full output** reports each peak/gene pair on a separate line | |
156 (i.e. a multi-line output format). | |
157 | |
158 In "full" output mode, additional options are available: | |
159 | |
160 * The output files can be "padded" with extra (empty) lines to ensure | |
161 that there are always the same number of lines for each peak or | |
162 gene, if fewer than the requested number of hits are found. | |
163 * "Summary" datasets can also be requested, which include just the | |
164 nearest peak reported for each gene (and vice versa). | |
0 | 165 |
1 | 166 In either mode these data will also be output in a single MS Excel file, |
167 which contains one sheet per result set. | |
168 | |
169 .. class:: warning | |
170 | |
171 Using "compact" output with the number of hits limited to more than 4 | |
172 peak/gene pairs (or with no limit at all) can result in a large number | |
173 of columns in the output files, which in some versions of Galaxy will | |
174 not be properly displayed. However the data files themselves should be | |
175 okay. | |
0 | 176 |
1 | 177 ------------- |
178 | |
179 .. class:: informark | |
180 | |
181 **More information** | |
182 | |
183 It is recommended that you refer to the ``RnaChipIntegrator`` | |
184 documentation for information on the contents of each output file: | |
185 | |
186 * http://rnachipintegrator.readthedocs.org/en/latest/ | |
0 | 187 |
188 ------------- | |
189 | |
190 .. class:: infomark | |
191 | |
192 **Credits** | |
193 | |
194 This Galaxy tool has been developed within the Bioinformatics Core Facility at the | |
195 University of Manchester. It runs the RnaChipIntegrator package which has also been | |
196 developed by this group, and is documented at | |
1 | 197 https://pypi.python.org/pypi/RnaChipIntegrator/ |
0 | 198 |
199 Please kindly acknowledge the Bioinformatics Core Facility if you use this tool. | |
200 </help> | |
1 | 201 <expand macro="citations" /> |
0 | 202 </tool> |