annotate fasta_affixer.xml @ 12:6b7d31026d1c draft

Uploaded
author petr-novak
date Tue, 04 Feb 2020 08:38:22 -0500
parents c2c69c6090f0
children 58807b35777a
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
1 <tool id="fasta_affixer" name="FASTA read name affixer" version="1.0.0">
9
c2c69c6090f0 Uploaded
petr-novak
parents: 0
diff changeset
2 <description> Appending suffix and prefix to the read names </description>
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
3 <command interpreter="python3">
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
4 fasta_affixer.py -f $input -p "$prefix" -s "$suffix" -n $nspace -o $output
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
5 </command>
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
6
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
7 <inputs>
9
c2c69c6090f0 Uploaded
petr-novak
parents: 0
diff changeset
8 <param format="fasta" type="data" name="input" label="Choose your FASTA file" />
c2c69c6090f0 Uploaded
petr-novak
parents: 0
diff changeset
9 <param name="prefix" type="text" size="10" value="" label="Prefix" help="Enter prefix which will be added to all read names" />
c2c69c6090f0 Uploaded
petr-novak
parents: 0
diff changeset
10 <param name="suffix" type="text" size="10" value="" label="Suffix" help="Enter suffix which will be added to all read names"/>
c2c69c6090f0 Uploaded
petr-novak
parents: 0
diff changeset
11 <param name="nspace" type="integer" size="10" value="0" min="0" max="1000" label="Number of spaces in the name to ignore" help="By default, a string before the first space is considered to be the read name, and all characters following the space are discarded. If you want to keep the information following the space(s) in the name, enter positive integer."/>
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
12 </inputs>
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
13
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
14
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
15 <outputs>
9
c2c69c6090f0 Uploaded
petr-novak
parents: 0
diff changeset
16 <data format="fasta" name="output" label="FASTA dataset ${input.hid} with modified sequence names" />
0
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
17 </outputs>
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
18
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
19 <tests>
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
20 <test>
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
21 <param name="input" value="single_output.fasta" />
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
22 <param name="prefix" value="TEST" />
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
23 <param name="suffix" value="OK"/>
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
24 <param name="nspace" value="0" />
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
25 <output name="output" value="prefix_suffix.fasta" />
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
26 </test>
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
27 </tests>
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
28 <help>
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
29 **What it does**
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
30
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
31 Tool for appending prefix and suffix to sequence names in FASTA-formatted sequences. This tool is useful
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
32 if you want to do comparative analysis with RepeatExplorer and need to
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
33 append sample codes to sequence identifiers.
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
34
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
35 **Example**
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
36 The following fasta file:
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
37
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
38 ::
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
39
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
40 >123454
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
41 acgtactgactagccatgacg
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
42 >234235
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
43 acgtactgactagccatgacg
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
44
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
45 is renamed to:
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
46
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
47 ::
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
48
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
49 >prefix123454suffix
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
50 acgtactgactagccatgacg
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
51 >prefix234235suffix
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
52 acgtactgactagccatgacg
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
53
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
54
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
55 By default, anything after the first space is
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
56 excluded from the sequence name. For example, for the sequence:
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
57
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
58 ::
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
59
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
60 >SRR352150.23846180 HWUSI-EAS1786:7:119:15910:19280/1
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
61 CTGGATTCTATACCTTTGGCAACTACTTCTTGGTTGATCAGGAAATTAACACTAGTAGTTTAGGCAATTTGGAATGGTGCCAAAGATGTATAGAACTTTC
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
62 IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIGIIIHIIIIIFIIIIIIHDHBBIHFIHIIBHHDDHIFHIHIIIHIHGGDFDEI@EGEGFGFEFB@ECG
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
63
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
64 When **Number of spaces in the name to ignore** is set to 0 (default), the output will be:
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
65
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
66 ::
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
67
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
68 >prefixSRR352150.23846180suffix
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
69 CTGGATTCTATACCTTTGGCAACTACTTCTTGGTTGATCAGGAAATTAACACTAGTAGTTTAGGCAATTTGGAATGGTGCCAAAGATGTATAGAACTTTC
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
70
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
71
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
72 If you want to keep the text after the first space, setting **Number of spaces in the name to ignore** to 1 will yield:
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
73
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
74 ::
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
75
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
76 >prefixSRR352150.23846180 HWUSI-EAS1786:7:119:15910:19280/1suffix
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
77 CTGGATTCTATACCTTTGGCAACTACTTCTTGGTTGATCAGGAAATTAACACTAGTAGTTTAGGCAATTTGGAATGGTGCCAAAGATGTATAGAACTTTC
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
78
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
79
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
80 </help>
a4cd8608ef6b Uploaded
petr-novak
parents:
diff changeset
81 </tool>