comparison fuma.xml @ 4:cb0543909e83 draft

planemo upload for repository https://github.com/ErasmusMC-Bioinformatics/fuma_galaxy_wrapper commit 36132cfcfe9203c499b73a2f0eea570c05e07ab8
author yhoogstrate
date Fri, 20 Nov 2015 11:05:18 -0500
parents 4966079d474b
children a5f10935f9ab
comparison
equal deleted inserted replaced
3:4966079d474b 4:cb0543909e83
1 <?xml version="1.0" encoding="UTF-8"?> 1 <?xml version="1.0" encoding="UTF-8"?>
2 <tool id="fuma" name="FuMa" version="2.10.0.a"> 2 <tool id="fuma" name="FuMa" version="2.11.0.a">
3 <description>match detected fusion genes based on gene names (in particular for RNA-Seq).</description> 3 <description>match detected fusion genes based on gene names (in particular for RNA-Seq)</description>
4 4
5 <requirements> 5 <requirements>
6 <requirement type="package" version="2.7">python</requirement> 6 <requirement type="package" version="2.7">python</requirement>
7 <requirement type="package" version="2.10.0">fuma</requirement> 7 <requirement type="package" version="2.11.0">fuma</requirement>
8 </requirements> 8 </requirements>
9 9
10 <version_command>fuma --version 2>&amp;1 | head -n 1</version_command><!-- -V also works, but is not GNU standard --> 10 <version_command>fuma --version 2>&amp;1 | head -n 1</version_command><!-- -V also works, but is not GNU standard -->
11 11
12 <command><![CDATA[ 12 <command><![CDATA[
73 <option value="tophat-fusion_pre">Tophat Fusion Pre (fusions.out)</option> 73 <option value="tophat-fusion_pre">Tophat Fusion Pre (fusions.out)</option>
74 <option value="tophat-fusion_post_potential_fusion">Tophat Fusion Post (potential_fusion.txt)</option> 74 <option value="tophat-fusion_post_potential_fusion">Tophat Fusion Post (potential_fusion.txt)</option>
75 <option value="tophat-fusion_post_result">Tophat Fusion Post (result.txt)</option> 75 <option value="tophat-fusion_post_result">Tophat Fusion Post (result.txt)</option>
76 <option value="tophat-fusion_post_result_html">Tophat Fusion Post (result.html)</option> 76 <option value="tophat-fusion_post_result_html">Tophat Fusion Post (result.html)</option>
77 </param> 77 </param>
78 <param name="gene_annotation" type="data" format="bed" label="Corresponding gene-name annotation file (BED format)" help="Make use of persistent gene annotations! Gene annotations should only be different if different reference genome builds were used." /> 78 <param name="gene_annotation" type="data" format="bed" label="Corresponding gene-name annotation file (BED format)" help="Make use of persistent gene annotations! Gene annotations should only be different if different reference genome builds were used" />
79 </repeat> 79 </repeat>
80 80
81 <conditional name="params"> 81 <conditional name="params">
82 <param name="settingsType" type="select" label="Settings to use" help="You can use the default settings or set custom values for any FuMa parameter."> 82 <param name="settingsType" type="select" label="Settings to use" help="You can use the default settings or set custom values for any FuMa parameter">
83 <option value="preSet" selected="true">Use Defaults</option> 83 <option value="preSet" selected="true">Use Defaults</option>
84 <option value="full">Full parameter list</option> 84 <option value="full">Full parameter list</option>
85 </param> 85 </param>
86 <when value="preSet"> 86 <when value="preSet">
87 <param name="strand_specific_matching" type="hidden" value="--strand-specific-matching" /> 87 <param name="strand_specific_matching" type="hidden" value="--strand-specific-matching" />
88 <param name="acceptor_donor_order_specific_matchig" type="hidden" value="--acceptor-donor-order-specific-matching" /> 88 <param name="acceptor_donor_order_specific_matchig" type="hidden" value="--acceptor-donor-order-specific-matching" />
89 </when> 89 </when>
90 <when value="full"> 90 <when value="full">
91 <param name="matching_method" type="select" label="Matching method: technique used to match fusion genes based on annotated gene sets" help="Overlap is the most sensitive but also more sensitive for long gene artefacts; subset is the recommended technique and EGM is conservative."> 91 <param name="matching_method" type="select" label="Matching method: technique used to match fusion genes based on annotated gene sets" help="Overlap is the most sensitive but also more sensitive for long gene artefacts; subset is the recommended technique and EGM is conservative">
92 <option value="overlap">Overlap</option> 92 <option value="overlap">Overlap</option>
93 <option value="subset" selected="True">Subset</option> 93 <option value="subset" selected="True">Subset</option>
94 <option value="egm">Exact Geneset Matching (EGM)</option> 94 <option value="egm">Exact Geneset Matching (EGM)</option>
95 </param> 95 </param>
96 96
97 <param name="strand_specific_matching" type="boolean" checked="True" truevalue="--strand-specific-matching" falsevalue="" label="Consider fusion genes distinct when the breakpoints have different strands" help="Only a limited number of file formats support this feature." /> 97 <param name="strand_specific_matching" type="boolean" checked="True"
98 <param name="acceptor_donor_order_specific_matchig" type="boolean" checked="True" truevalue="--acceptor-donor-order-specific-matching" falsevalue="" label="Consider fusion genes distinct when the donor and acceptor sites are swapped (A,B) != (B,A)" help="This settings is not recommended when fusion genes detected in DNA-Seq are used" /> 98 truevalue="--strand-specific-matching"
99 falsevalue="--no-strand-specific-matching"
100 label="Consider fusion genes distinct when the breakpoints have different strands: (A&lt;-,B&lt;-) != (-&gt;A,B&lt;-); default"
101 help="Only a limited number of file formats support this feature" />
102 <param name="acceptor_donor_order_specific_matchig" type="boolean" checked="False"
103 truevalue="--acceptor-donor-order-specific-matching"
104 falsevalue="--no-acceptor-donor-order-specific-matching"
105 label="Consider fusion genes distinct when the donor and acceptor sites are swapped (A,B) != (B,A)"
106 help="This settings is not recommended when fusion genes detected in DNA-Seq are used" />
99 107
100 <param name="output_format" type="select" label="Output format"> 108 <param name="output_format" type="select" label="Output format">
101 <option value="list_boolean" selected="true">List (Boolean)</option> 109 <option value="list_boolean" selected="true">List (Boolean)</option>
102 <option value="list">List</option> 110 <option value="list">List</option>
103 <option value="summary">Count summary</option> 111 <option value="summary">Count summary</option>
165 <!-- </repeat> --> 173 <!-- </repeat> -->
166 174
167 <param name="settingsType" value="full" /> 175 <param name="settingsType" value="full" />
168 176
169 <param name="matching_method" value="subset" /> 177 <param name="matching_method" value="subset" />
170 <param name="strand_specific_matching" value="" /> 178 <param name="strand_specific_matching" value="False" /><!-- Set to false, automatically sets the false value -->
171 <param name="acceptor_donor_order_specific_matchig" value="" /> 179 <param name="acceptor_donor_order_specific_matchig" value="False" /><!-- Set to false, automatically sets the false value -->
172 <param name="output_format" value="list_boolean" /> 180 <param name="output_format" value="list_boolean" />
173 181
174 <output name="fuma_overview" file="edgren_test_02_unspecifc_matching_output.txt" /> 182 <output name="fuma_overview" file="edgren_test_02_unspecifc_matching_output.txt" />
175 </test> 183 </test>
176 </tests> 184 </tests>
178 <help><![CDATA[ 186 <help><![CDATA[
179 ============ 187 ============
180 Introduction 188 Introduction
181 ============ 189 ============
182 190
183 FuMa (Fusion Matcher) matches predicted fusion events (both genomic and transcriptomic) according to chromosomal location or assocatiated gene annotation(s) where the latter should be genome build inspecific. 191 A new generation of tools that identify fusion genes in RNA-seq data is limited in either sensitivity and or specificity. To allow further downstream analysis and to estimate performance, predicted fusion genes from different tools have to be compared. However, the transcriptomic context complicates genomic location-based matching. FusionMatcher (FuMa) is a program that reports identical fusion genes based on gene-name annotations. FuMa automatically compares and summarizes all combinations of two or more datasets in a single run, without additional programming necessary. FuMa uses one gene annotation, avoiding mismatches caused by tool specific gene annotations. FuMa matches 10% more fusion genes compared to exact gene matching (EGM) due to overlapping genes and accepts intermediate output files that allow a step wise analysis of corresponding tools.
184
185 Because RNA-Sequencing deals with samples that may have undergrond splicing, reads may split up because of biological processes. If a fusion event takes place, the same thing may happen. Therefore we hypothesize that using spanning read distances may be unreliable, because there are known introns of > 100kb. Therefore, FuMa translates the breakpoint to gene names, and only overlaps breakpoints with the same genename(s).
186 192
187 ===== 193 =====
188 Usage 194 Usage
189 ===== 195 =====
190 196
238 244
239 ]]></help> 245 ]]></help>
240 246
241 <citations> 247 <citations>
242 <citation type="bibtex"> 248 <citation type="bibtex">
243 @unpublished{fuma, 249 @article{fuma,
244 author = {Youri Hoogstrate}, 250 author = { Hoogstrate, Youri and Böttcher, René and Hiltemann, Saskia and van der Spek, Peter J. and Stubbs, Andrew P. },
245 title = {FuMa: reporting overlap in RNA-seq detected fusion genes}, 251 title = {FuMa: reporting overlap in RNA-seq detected fusion genes},
246 url = { https://github.com/yhoogstrate/fuma } 252 url = { https://github.com/yhoogstrate/fuma }
247 } 253 }
248 </citation> 254 </citation>
249 </citations> 255 </citations>