annotate preprocessing.xml @ 6:dff6a5a17221 draft

planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 4dd7269185f6fb9bdc007028007d6540f4cf057d
author rnateam
date Sat, 25 Mar 2017 16:53:38 -0400
parents e4bd880868b0
children 07ad2d77f28a
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
1 <tool id="preproc" name="Preprocessing" version="0.1">
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
2 <requirements>
6
dff6a5a17221 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 4dd7269185f6fb9bdc007028007d6540f4cf057d
rnateam
parents: 5
diff changeset
3 <requirement type="package" version="0.1.12">graphclust-wrappers</requirement>
0
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
4 </requirements>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
5 <stdio>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
6 <exit_code range="1:" />
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
7 </stdio>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
8 <command>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
9 <![CDATA[
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
10
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
11 'preprocessing.pl'
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
12 '$fastaFile' $max_length $in_winShift $min_seq_length
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
13
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
14 ]]>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
15 </command>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
16 <inputs>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
17 <param type="data" name="fastaFile" format="fasta" />
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
18 <param name="max_length" type="integer" value="10000" size="5" label="window size"/>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
19 <param name="in_winShift" type="integer" value="100" size="5" label="window shift in percent"/>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
20 <param name="min_seq_length" type="integer" value="5" size="5" label="minimum sequence length"/>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
21 </inputs>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
22
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
23 <outputs>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
24 <data name="data.fasta" format="fasta" from_work_dir="FASTA/data.fasta" label="data.fasta"/>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
25 <data name="data.map" format="txt" from_work_dir="FASTA/data.map" label="data.map"/>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
26 <data name="data.names" format="txt" from_work_dir="FASTA/data.names" label="data.names"/>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
27 <data name="data.fasta.scan" format="fasta" from_work_dir="FASTA/data.fasta.scan" label="data.fasta.scan"/>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
28 <data name="FASTA" format="zip" from_work_dir="FASTA.zip" label="FASTA.ZIP"/>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
29 </outputs>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
30
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
31
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
32 <tests>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
33 <test>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
34 <param name="fastaFile" value="input.fa"/>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
35 <param name="max_length" value="10000"/>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
36 <param name="in_winShift" value="100"/>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
37 <param name="min_seq_length" value="5"/>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
38 <output name="data.fasta" file="FASTA/data.fasta"/>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
39 <output name="data.map" file="FASTA/data.map" />
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
40 <output name="data.names" file="FASTA/data.names"/>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
41 <output name="data.fasta.scan" file="FASTA/data.fasta.scan" />
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
42 </test>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
43 </tests>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
44
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
45 <help>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
46 <![CDATA[
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
47
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
48 **What it does**
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
49
6
dff6a5a17221 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 4dd7269185f6fb9bdc007028007d6540f4cf057d
rnateam
parents: 5
diff changeset
50 The tool takes as input a set of sequences in FASTA format and creates the final input for GraphClust based on given parameters.
0
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
51
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
52 **Parameters**
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
53
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
54 + **window size** : All input sequences are split into fragments of this length.
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
55 The shift of the sliding window can be defined via option *window shift in percent*.
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
56 This parameter reflects the expected length of signals to be found.
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
57 Slightly larger windows are usually ok. Too small windows can disturb existing signals.
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
58
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
59
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
60
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
61
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
62 + **window shift in percent** : Relative window size in % for window shift during input preprocessing.
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
63 Please note that a small shift results in many more fragments for clustering. The benefit is that RNA
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
64 motifs/structures are not destroyed by arbitrary split points. Smaller
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
65 shifts usually increase the cluster quality. Too small shifts (<20) are not
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
66 recommended as a dense center is "polluted" by overlapping fragments and
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
67 no other occurrences in the dataset can be found.
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
68
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
69
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
70
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
71
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
72
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
73 + **minimum sequence length** : Minimal length of input sequences.
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
74 Every input sequence below that length is ignored completely during clustering.
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
75
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
76
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
77 ]]></help>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
78
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
79
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
80 <citations>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
81 <citation type="doi">10.1093/bioinformatics/bts224</citation>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
82 </citations>
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
83
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
84
3eb088816194 planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 21aaee40723b5341b4236edeb0e72995c2054053
rnateam
parents:
diff changeset
85 </tool>