comparison fasta2shrep_gspan.xml @ 0:b6e6830ff06b draft

planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust/GSPAN commit 21aaee40723b5341b4236edeb0e72995c2054053
author rnateam
date Fri, 16 Dec 2016 07:35:04 -0500
parents
children 358c52752305
comparison
equal deleted inserted replaced
-1:000000000000 0:b6e6830ff06b
1 <tool id="gspan" name="fasta_to_gspan" version="0.1">
2 <requirements>
3 <requirement type="package" version="0.1">graphclust-wrappers</requirement>
4 <requirement type="package" version="2.1.6">rnashapes</requirement>
5 </requirements>
6 <stdio>
7 <exit_code range="1:" />
8 </stdio>
9 <command>
10 <![CDATA[
11
12 'fasta2shrep_gspan.pl' --fasta '$dataFasta' $i_crop_unpaired_ends $i_abstr $i_stacks -t "3=0,5=80" -M $M -c $rel_energy_range -win $wins -shift $shift $u $seq_graph_t --group $group
13
14 ]]>
15 </command>
16 <inputs>
17 <param type="data" name="dataFasta" format="fasta" />
18 <param name="i_stacks" truevalue="-stack" falsevalue="" checked="True" type="boolean" label="Add stacking information to graphs." help="-stack"/>
19 <param name="i_abstr" truevalue="-abstr" falsevalue="" type="boolean" label="Add abstract structure graphs to the single shrep graph instances." help="-abstr"/>
20 <param name="i_crop_unpaired_ends" truevalue="-cue" falsevalue="" type="boolean" label="Add abstract structure graphs to the single shrep graph instances." help="-cue"/>
21 <param name="M" type="integer" value="5" size="7" label="Max number of shreps that should be taken per window." help="-M"/>
22 <param name="rel_energy_range" type="integer" value="20" size="7" label=" Relative energy range, i.e. percentage (%) of MFE energy (RNAshapes)" help="-c"/>
23 <param name="wins" type="text" value="40,150" size="20" label=" A list of window sizes to use" help="comma separated integers"/>
24 <param name="shift" type="integer" value="30" size="7" label="The shift of the window, relative to the window size given inpercent." help="by default 30"/>
25 <param name="u" truevalue="-u" falsevalue="" checked="True" type="boolean" label="Ignore unstable structures (RNAshapes)" help="-u"/>
26 <param name="seq_graph_t" truevalue="--seq-graph-t" falsevalue="" checked="True" type="boolean" label="Add for each 't #' a graph which contains no structure" help="--seq-graph-t"/>
27 <param name="group" type="integer" value="10000" size="7" label="Group size." help="by default 10000"/>
28 </inputs>
29 <outputs>
30 <data name="gspan.zip" format="searchgui_archive" from_work_dir="GSPAN_Outputs/1.group.gspan.bz2" label="gspan zip" />
31 </outputs>
32 <tests>
33 <test>
34 <param name="dataFasta" value="data.fasta"/>
35 <output name="gspan.zip" file="GSPAN_Outputs/1.group.gspan.bz2" />
36 </test>
37 </tests>
38 <help>
39 <![CDATA[
40
41 **What it does**
42
43 For each fragment of input sequence we use RNAshapes to create a set of structures.
44 The default parameters for example consider for each input fragment again a
45 window of size 40nt and 150nt with a window shift of 30%. This allows to
46 consider local structures as well as global structures for a fragment.
47 From each such RNAshape window we take the top 5 shreps (suboptimal
48 structures for the top 5 shapes) within 20% of the mfe energy of that window
49 and convert them into graphs.
50 As shape level (abstraction level) we use 3 for short sequences and 5 for
51 sequences >= 80nt. Please see also RNAshapes documentation for all these
52 terms.
53
54
55 **Parameters**
56
57 + **input** : Sequences in Fasta format.
58
59 + **stack** : This adds an additional vertex (type P) for each pair of stacked base-pairs and four edges
60 (type p) from each of the involved bases to the new vertex.
61
62 + **abstr** : Add abstract structure graphs to the single shrep graph instances.
63
64 + **cue** : Crop unpaired ends. If you give this flag, then the unpaired ends of each single structure are ignored. E.g. the structure
65 ...(((...))).. becomes just (((...)))
66
67 + **M** : Max number of shreps that should be taken per window.
68
69 + **c** : Relative energy range, i.e. percentage (%) of MFE energy (RNAshapes) Use only one of -e and -c!
70
71 + **wins** : A list of window sizes to use. If none are given (empty string ''), then the entire sequence is taken with no windows. Each window > 1 required!
72
73 + **shift** : The shift of the window, relative to the window size given in percent. So you give which percent of the window size shall be
74 used for the shift. Of course the shift is rounded down to the
75 nearest whole number.
76 Example 20 % of a window 150 would result in a step size of 30 nt.
77 It is a relative parameter, as you can give different window sizes.
78 If you do not give this parameter there is a default shift of 1 nt.
79
80 + **u** : Ignore unstable structures (RNAshapes). This option filters out closed structures with positive free energy.
81
82 + **seq-graph-t** : Add for each 't #' a graph which contains no structure
83
84 + **group** : Combine/group that number of input seqs into 1 gspan file output name is then '<INT>.group.gspan.bz2'
85
86 ]]>
87 </help>
88 <citations>
89 <citation type="doi">10.1093/bioinformatics/bts224</citation>
90 <citation type="bibtex">@article{jan:gie:2015,
91 author={Janssen, Stefan and Giegerich, Robert},
92 title={The RNA shapes studio},
93 journal={Bioinformatics},
94 year={2015},
95 doi={10.1093/bioinformatics/btu649},
96 url={http://bioinformatics.oxfordjournals.org/content/31/3/423.abstract}}</citation>
97 </citations>
98 </tool>