annotate removeFastaSubSequence.xml @ 0:9ec27561593e draft

planemo upload
author pravs
date Wed, 02 Aug 2017 18:09:53 -0400
parents
children d49328dfeceb
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
9ec27561593e planemo upload
pravs
parents:
diff changeset
1
9ec27561593e planemo upload
pravs
parents:
diff changeset
2 <tool id="removeFastaSubSequence" name="Remove Fasta Substring Sequence" version="1.0.0">
9ec27561593e planemo upload
pravs
parents:
diff changeset
3 <description>Removes query sequences that occur as a subsequence of a sequence in a reference FASTA file.</description>
9ec27561593e planemo upload
pravs
parents:
diff changeset
4 <requirements>
9ec27561593e planemo upload
pravs
parents:
diff changeset
5 <requirement type="package" version="1.70">biopython</requirement>
9ec27561593e planemo upload
pravs
parents:
diff changeset
6 </requirements>
9ec27561593e planemo upload
pravs
parents:
diff changeset
7 <command interpreter="python"><![CDATA[removeFastaSubSequence.py $ref_fastafile $query_fastafile $output]]></command>
9ec27561593e planemo upload
pravs
parents:
diff changeset
8 <inputs>
9ec27561593e planemo upload
pravs
parents:
diff changeset
9 <param name="ref_fastafile" type="data" format="fasta">
9ec27561593e planemo upload
pravs
parents:
diff changeset
10 <label>Input Reference Fasta File</label>
9ec27561593e planemo upload
pravs
parents:
diff changeset
11 </param>
9ec27561593e planemo upload
pravs
parents:
diff changeset
12 <param name="query_fastafile" type="data" format="fasta">
9ec27561593e planemo upload
pravs
parents:
diff changeset
13 <label>Input Query Fasta File</label>
9ec27561593e planemo upload
pravs
parents:
diff changeset
14 </param>
9ec27561593e planemo upload
pravs
parents:
diff changeset
15 </inputs>
9ec27561593e planemo upload
pravs
parents:
diff changeset
16
9ec27561593e planemo upload
pravs
parents:
diff changeset
17 <outputs>
9ec27561593e planemo upload
pravs
parents:
diff changeset
18 <data format="fasta" name="output" label="uniqSeq_${query_fastafile.name.rsplit('.',1)[0]}.fasta" />
9ec27561593e planemo upload
pravs
parents:
diff changeset
19 </outputs>
9ec27561593e planemo upload
pravs
parents:
diff changeset
20
9ec27561593e planemo upload
pravs
parents:
diff changeset
21 <tests>
9ec27561593e planemo upload
pravs
parents:
diff changeset
22 <test>
9ec27561593e planemo upload
pravs
parents:
diff changeset
23 <param name="ref_fastafile" value="test_ref.fasta" />
9ec27561593e planemo upload
pravs
parents:
diff changeset
24 <param name="query_fastafile" value="test_query.fasta" />
9ec27561593e planemo upload
pravs
parents:
diff changeset
25 <output name="output" file="uniqSeq_test_query.fasta">
9ec27561593e planemo upload
pravs
parents:
diff changeset
26 <assert_contents>
9ec27561593e planemo upload
pravs
parents:
diff changeset
27 <has_text text="ENSMUST00000193003" />
9ec27561593e planemo upload
pravs
parents:
diff changeset
28 </assert_contents>
9ec27561593e planemo upload
pravs
parents:
diff changeset
29 </output>
9ec27561593e planemo upload
pravs
parents:
diff changeset
30 </test>
9ec27561593e planemo upload
pravs
parents:
diff changeset
31 </tests>
9ec27561593e planemo upload
pravs
parents:
diff changeset
32
9ec27561593e planemo upload
pravs
parents:
diff changeset
33
9ec27561593e planemo upload
pravs
parents:
diff changeset
34 <help>
9ec27561593e planemo upload
pravs
parents:
diff changeset
35 This program removes from the query FASTA file every sequence that is present as a subsequence (substring) of a sequence in the reference FASTA file.
9ec27561593e planemo upload
pravs
parents:
diff changeset
36
9ec27561593e planemo upload
pravs
parents:
diff changeset
37 EXAMPLE:
9ec27561593e planemo upload
pravs
parents:
diff changeset
38
9ec27561593e planemo upload
pravs
parents:
diff changeset
39 ----
9ec27561593e planemo upload
pravs
parents:
diff changeset
40
9ec27561593e planemo upload
pravs
parents:
diff changeset
41 Ref sequences:
9ec27561593e planemo upload
pravs
parents:
diff changeset
42
9ec27561593e planemo upload
pravs
parents:
diff changeset
43 >reference_seq_1
9ec27561593e planemo upload
pravs
parents:
diff changeset
44
9ec27561593e planemo upload
pravs
parents:
diff changeset
45 TSLDKDHLELCCTLSLPFSWACSWVLVLRLSINGQLPRSRLWAAHCLWGVP
9ec27561593e planemo upload
pravs
parents:
diff changeset
46
9ec27561593e planemo upload
pravs
parents:
diff changeset
47 >reference_seq_2
9ec27561593e planemo upload
pravs
parents:
diff changeset
48
9ec27561593e planemo upload
pravs
parents:
diff changeset
49 RGLCISGLEKEVQVQSRQAEGPVHLWLRKGSTSAE
9ec27561593e planemo upload
pravs
parents:
diff changeset
50
9ec27561593e planemo upload
pravs
parents:
diff changeset
51 ----
9ec27561593e planemo upload
pravs
parents:
diff changeset
52
9ec27561593e planemo upload
pravs
parents:
diff changeset
53 Query Sequences:
9ec27561593e planemo upload
pravs
parents:
diff changeset
54
9ec27561593e planemo upload
pravs
parents:
diff changeset
55 >query_seq_1
9ec27561593e planemo upload
pravs
parents:
diff changeset
56
9ec27561593e planemo upload
pravs
parents:
diff changeset
57 TKTILNYAVLSPCLSPGHVLGC
9ec27561593e planemo upload
pravs
parents:
diff changeset
58
9ec27561593e planemo upload
pravs
parents:
diff changeset
59
9ec27561593e planemo upload
pravs
parents:
diff changeset
60 >query_seq_2
9ec27561593e planemo upload
pravs
parents:
diff changeset
61
9ec27561593e planemo upload
pravs
parents:
diff changeset
62 LDKDHLELCCTLSLPFSWACSWVLVL
9ec27561593e planemo upload
pravs
parents:
diff changeset
63
9ec27561593e planemo upload
pravs
parents:
diff changeset
64
9ec27561593e planemo upload
pravs
parents:
diff changeset
65 >query_seq_3
9ec27561593e planemo upload
pravs
parents:
diff changeset
66
9ec27561593e planemo upload
pravs
parents:
diff changeset
67 LWGVPRGLCISG
9ec27561593e planemo upload
pravs
parents:
diff changeset
68
9ec27561593e planemo upload
pravs
parents:
diff changeset
69 ----
9ec27561593e planemo upload
pravs
parents:
diff changeset
70
9ec27561593e planemo upload
pravs
parents:
diff changeset
71 Output Sequences:
9ec27561593e planemo upload
pravs
parents:
diff changeset
72
9ec27561593e planemo upload
pravs
parents:
diff changeset
73 >query_seq_1
9ec27561593e planemo upload
pravs
parents:
diff changeset
74
9ec27561593e planemo upload
pravs
parents:
diff changeset
75 TKTILNYAVLSPCLSPGHVLGC
9ec27561593e planemo upload
pravs
parents:
diff changeset
76
9ec27561593e planemo upload
pravs
parents:
diff changeset
77
9ec27561593e planemo upload
pravs
parents:
diff changeset
78 >query_seq_3
9ec27561593e planemo upload
pravs
parents:
diff changeset
79
9ec27561593e planemo upload
pravs
parents:
diff changeset
80 LWGVPRGLCISG
9ec27561593e planemo upload
pravs
parents:
diff changeset
81
9ec27561593e planemo upload
pravs
parents:
diff changeset
82 ----
9ec27561593e planemo upload
pravs
parents:
diff changeset
83
9ec27561593e planemo upload
pravs
parents:
diff changeset
84 The output sequence file will contain only query_seq_1 and query_seq_3. query_seq_2 is removed because its sequence "LDKDHLELCCTLSLPFSWACSWVLVL" is
9ec27561593e planemo upload
pravs
parents:
diff changeset
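85 present as a substring of reference_seq_1's sequence "TSLDKDHLELCCTLSLPFSWACSWVLVLRLSINGQLPRSRLWAAHCLWGVP". query_seq_3 is kept because "LWGVPRGLCISG" only matches across the boundary between reference_seq_1 and reference_seq_2, not within either reference sequence on its own.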
9ec27561593e planemo upload
pravs
parents:
diff changeset
86
9ec27561593e planemo upload
pravs
parents:
diff changeset
87 </help>
9ec27561593e planemo upload
pravs
parents:
diff changeset
88 </tool>