annotate fasta_affixer.xml @ 6:f224513123a1 draft

Uploaded
author petr-novak
date Mon, 02 Dec 2019 03:45:28 -0500
parents a4cd8608ef6b
children c2c69c6090f0
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
1 <tool id="fasta_affixer" name="FASTA read name affixer" version="1.0.0">
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
2 <description> Tool appending suffix and prefix to sequences names </description>
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
3 <command interpreter="python3">
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
4 fasta_affixer.py -f $input -p "$prefix" -s "$suffix" -n $nspace -o $output
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
5 </command>
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
6
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
7 <inputs>
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
8 <param format="fasta" type="data" name="input" label="Choose your fasta file" />
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
9 <param name="prefix" type="text" size="10" value="" label="Prefix" help="Enter prefix which will be added to all sequences names" />
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
10 <param name="suffix" type="text" size="10" value="" label="Suffix" help="Enter suffix which will be added to all sequences names"/>
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
11 <param name="nspace" type="integer" size="10" value="0" min="0" max="1000" label="Number of spaces in name to ignore" help="Sequence name is a string before the first space. If you want name to include spaces in name, enter positive integer. All other characters beyond ignored spaces are omitted"/>
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
12 </inputs>
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
13
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
14
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
15 <outputs>
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
16 <data format="fasta" name="output" label="fasta dataset ${input.hid} with modified sequence names" />
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
17 </outputs>
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
18
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
19 <tests>
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
20 <test>
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
21 <param name="input" value="single_output.fasta" />
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
22 <param name="prefix" value="TEST" />
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
23 <param name="suffix" value="OK"/> <!-- name must match the "suffix" input declared in <inputs> -->
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
24 <param name="nspace" value="0" />
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
25 <output name="output" value="prefix_suffix.fasta" />
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
26 </test>
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
27 </tests>
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
28 <help>
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
29 **What it does**
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
30
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
31 Tool for appending a prefix and suffix to sequence names in FASTA-formatted sequences. This tool is useful
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
32 if you want to do comparative analysis with RepeatExplorer and need to
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
33 append sample codes to sequence identifiers.
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
34
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
35 **Example**
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
36 The following fasta file:
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
37
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
38 ::
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
39
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
40 >123454
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
41 acgtactgactagccatgacg
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
42 >234235
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
43 acgtactgactagccatgacg
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
44
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
45 is renamed to:
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
46
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
47 ::
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
48
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
49 >prefix123454suffix
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
50 acgtactgactagccatgacg
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
51 >prefix234235suffix
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
52 acgtactgactagccatgacg
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
53
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
54
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
55 By default, anything after the first space is
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
56 excluded from the sequence name. For the example sequence:
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
57
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
58 ::
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
59
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
60 >SRR352150.23846180 HWUSI-EAS1786:7:119:15910:19280/1
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
61 CTGGATTCTATACCTTTGGCAACTACTTCTTGGTTGATCAGGAAATTAACACTAGTAGTTTAGGCAATTTGGAATGGTGCCAAAGATGTATAGAACTTTC
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
62 IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIGIIIHIIIIIFIIIIIIHDHBBIHFIHIIBHHDDHIFHIHIIIHIHGGDFDEI@EGEGFGFEFB@ECG
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
63
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
64 when **Number of spaces in name to ignore** is set to 0 (default) the output will be:
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
65
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
66 ::
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
67
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
68 >prefixSRR352150.23846180suffix
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
69 CTGGATTCTATACCTTTGGCAACTACTTCTTGGTTGATCAGGAAATTAACACTAGTAGTTTAGGCAATTTGGAATGGTGCCAAAGATGTATAGAACTTTC
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
70
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
71
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
72 If you want to keep spaces, setting **Number of spaces in name to ignore** to 1 will yield:
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
73
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
74 ::
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
75
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
76 >prefixSRR352150.23846180 HWUSI-EAS1786:7:119:15910:19280/1suffix
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
77 CTGGATTCTATACCTTTGGCAACTACTTCTTGGTTGATCAGGAAATTAACACTAGTAGTTTAGGCAATTTGGAATGGTGCCAAAGATGTATAGAACTTTC
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
78
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
79
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
80 </help>
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
81 </tool>