0
|
1 <tool id="noisy" name="Noisy" version="1.5.12.1">
|
|
2 <description>Cleaning aligned sequences</description>
|
|
3 <requirements>
|
|
4 <requirement type="package" version="1.5.12">noisy</requirement>
|
|
5 </requirements>
|
|
6 <command><![CDATA[
|
|
7 noisy $input
|
|
8
|
|
9 #if $sequence.seqtype == 'cfg' :
|
|
10 ## Automatic sequence detection
|
|
11 ## read an info file to choose which option set
|
|
12 #set $info = open( str($input_info) ).read()
|
|
13 #if 'dna' in $info:
|
|
14 --seqtype D
|
|
15 #else if 'protein' in $info :
|
|
16 --seqtype P
|
|
17 #end if
|
|
18
|
|
19 #else :
|
|
20 --seqtype $sequence.seqtype
|
|
21 #end if
|
|
22
|
|
23 --cutoff $cutoff
|
|
24 --distance $distance
|
|
25 #if $usematrix.matrix == "true":
|
|
26 --matrix $usematrix.matrixfile
|
|
27 #end if
|
|
28 #if $missingchar.setmissingchar == "true":
|
|
29 --missing $missingchar.chars
|
|
30 #end if
|
|
31 --ordering
|
|
32 #if $orderingmethode.ordering == "rand":
|
|
33 RAND[,$orderingmethode.randpermut]
|
|
34 #else if $orderingmethode.ordering == "list":
|
|
35 $orderingmethode.randpermutlist
|
|
36 #else:
|
|
37 $orderingmethode.ordering
|
|
38 #end if
|
|
39
|
|
40 $constant
|
|
41 $gap
|
|
42
|
|
43 --shuffles $shuffles
|
|
44 --smooth $smooth
|
|
45 --silent
|
|
46
|
|
47 ]]>
|
|
48 </command>
|
|
49 <inputs>
|
|
50 <param name="input" type="data" format="fasta" label="Source file" help="Fasta format" />
|
|
51 <conditional name="sequence">
|
|
52 <param name="seqtype" type="select" label="Sequence Coding">
|
|
53 <option value="D">DNA</option>
|
|
54 <option value="P">Protein</option>
|
|
55 <option value="R">RNA</option>
|
|
56 <option value="cfg">Config file</option>
|
|
57 </param>
|
|
58 <when value="D"></when>
|
|
59 <when value="P"></when>
|
|
60 <when value="R"></when>
|
1
|
61 <when value="cfg">
|
0
|
62 <param name="input_info" type="data" format="txt" label="info" help="Precompute file containning sequence description (dna or protein)" />
|
|
63 </when>
|
|
64 </conditional>
|
|
65 <param name="cutoff" type="float" value="0.8" min="0" max="1" label="cut-off [ 0-1 ]" help="Columns with a score below FLOAT are removed from the output alignment." />
|
|
66 <param name="distance" type="select" label="Distance methode used by NeighbotNet">
|
|
67 <option value="HAMMING">HAMMING</option>
|
|
68 <option value="GTR">GTR</option>
|
|
69 </param>
|
|
70 <conditional name="usematrix">
|
|
71 <param name="matrix" type="boolean" truevalue="true" falsevalue="" checked="False" label="Use matrix file" help="default is calculate distances with nnet"/>
|
|
72 <when value=""/>
|
|
73 <when value="true">
|
|
74 <param name="matrixfile" format="text" type="data" label="matrix file"/>
|
|
75 </when>
|
|
76 </conditional>
|
|
77 <conditional name="missingchar">
|
|
78 <param name="setmissingchar" type="boolean" truevalue="true" falsevalue="" checked="False" label="Set list of missing chars" />
|
|
79 <when value=""/>
|
|
80 <when value="true">
|
|
81 <param name="chars" type="text" label="Missing chars list"/>
|
|
82 </when>
|
|
83 </conditional>
|
|
84 <conditional name="orderingmethode">
|
|
85 <param name="ordering" type="select" display="radio" label="Choose ordering method">
|
|
86 <option value="nnet">NeighborNet</option>
|
|
87 <option value="qnet">QNet</option>
|
|
88 <option value="rand">Sample INT random permutation</option>
|
|
89 <option value="list">List of index MSA ordering</option>
|
|
90 <option value="all">All permutations</option>
|
|
91 </param>
|
|
92 <when value="nnet"/>
|
|
93 <when value="qnet"/>
|
|
94 <option value="all"/>
|
|
95 <when value="rand">
|
|
96 <param name="randpermut" type="integer" value="1000" label="random permutation"/>
|
|
97 </when>
|
|
98 <when value="list">
|
|
99 <param name="randpermutlist" type="text" label="Comma-seperated string of INT"/>
|
|
100 </when>
|
|
101 </conditional>
|
|
102 <param name="constant" type="boolean" truevalue="" falsevalue="--noconstant" checked="True" label="Constant columns in output alignment" />
|
|
103 <param name="gap" type="boolean" truevalue="" falsevalue="--nogap" checked="True" label="Count gap symbol as character state"/>
|
|
104 <param name="smooth" type="integer" value="1" min="0" max="1000" label="Running average over INT columns" help="Calculate a running average over the reliability score of INT columns and use this smoothed values to remove unreliable columns from the MAS.s" />
|
|
105 <param name="shuffles" type="integer" value="0" min="0" max="1000" label="Perform INT random shuffles per column of the MSA"/>
|
|
106 </inputs>
|
|
107 <outputs>
|
|
108 <data name="output1" format="fasta" label="Noisy Cleaned sequencies" from_work_dir="*_out.fas" />
|
|
109 <data name="output2" format="eps" label="Noisy Cleaned sequencies image" from_work_dir="*_typ.eps" />
|
|
110 <data name="output3" format="txt" label="Noisy Cleaned sequencies information" from_work_dir="*_sta.gr" />
|
|
111 </outputs>
|
|
112 <tests>
|
|
113 <test>
|
|
114 <param name="input" value="aln.fasta" />
|
|
115 <output name="output1" file="aln_out.fas" />
|
|
116 </test>
|
|
117 </tests>
|
|
118
|
|
119 <help>
|
|
120 <![CDATA[
|
|
121 Usage::
|
|
122
|
|
123 noisy [OPTIONS] MultiFastaAlignment
|
|
124
|
|
125 Options::
|
|
126
|
|
127 --cutoff FLOAT Set cutoff value to FLOAT. Columns with a score below FLOAT are removed from the output alignment.
|
|
128 (default is >0.80<)
|
|
129 --distance STRING Distance methode used by NeighbotNet.
|
|
130 (default is >HAMMING< [HAMMING|GTR])
|
|
131 -h, --help Print usage message for noisy.
|
|
132 --matrix FILE Use distance matrix for NeighbotNet from FILE.
|
|
133 (default is >calculate distances with nnet<)
|
|
134 --missing STRING Set list of missing characters to STRING.
|
|
135 (default is >N<)
|
|
136 --nogap Don't count gap symbol as character state.
|
|
137 (default is >0<)
|
|
138 --noconstant Ignore constant columns in output alignment.
|
|
139 (default is >0<)
|
|
140 --ordering STRING
|
|
141 Choose ordering method.
|
|
142 (default is >nnet<)
|
|
143 nnet NeighborNet
|
|
144 qnet QNet algorithm is O(n^4) both in time and memory, be careful when you use this option.
|
|
145 rand[,INT] sample INT random permutation. With rand a random sample of all possible orderings of the TAXA can be specified for which the reliability score is calculated
|
|
146 (default is >1000<)
|
|
147 INT,INT,... provide ordering explicitly as comma-seperated list of TAXA indices in the range (e.g 3,0,4,1,2 as ordering for the 5 TAXA in the input MSA).
|
|
148 all all permutations, If all is used than for all possible permutations of the TAXA the reliability score is calculated (Note that for more than 8 TAXA this can become rather time consuming!).
|
|
149
|
|
150 --shuffles INT Perform INT random shuffles per column.
|
|
151 (default is >0<)
|
|
152 -s, --silent Turn off status bar
|
|
153 (default is >0<)
|
|
154 --smooth INT Running avarage over INT columns.
|
|
155 (default is >1<)
|
|
156 --seqtype CHAR Set sequence type of input alignment to CHAR
|
|
157 (default is >D<) [D=DNA, P=Protein, R=RNA]
|
|
158 -v, --verbose Verbose mode. Causes noisy to print debugging
|
|
159 messages about its progress.
|
|
160 ]]>
|
|
161 </help>
|
|
162 <citations>
|
|
163 <citation type="doi">10.1186/1748-7188-3-7</citation>
|
|
164 <citation type="doi">10.1093/molbev/msl180</citation>
|
|
165 <citation type="doi">10.1093/molbev/msh018s</citation>
|
|
166 </citations>
|
|
167 </tool>
|