Mercurial > repos > abims-sbr > pairwise
comparison pairwise.xml @ 0:90b57ab0bd1d draft default tip
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
author | abims-sbr |
---|---|
date | Fri, 01 Feb 2019 10:23:16 -0500 |
parents | |
children |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:90b57ab0bd1d |
---|---|
1 <tool name="Pairwise" id="pairwise" version="2.1.1"> | |
2 | |
3 <description> | |
4 Find homologous couples by blast with RBH | |
5 </description> | |
6 | |
7 <macros> | |
8 <import>macros.xml</import> | |
9 </macros> | |
10 | |
11 <requirements> | |
12 <expand macro="python_required" /> | |
13 <requirement type="package" version="1.65">biopython</requirement> | |
14 <requirement type="package" version="0.9.22">diamond</requirement> | |
15 <requirement type="package" version="2.2.22">blast-legacy</requirement> | |
16 </requirements> | |
17 | |
18 <command><![CDATA[ | |
19 #set $infiles = "" | |
20 #for $input in $inputs | |
21 ln -s '$input' '$input.element_identifier'; | |
22 #set $infiles = $infiles + $input.element_identifier + "," | |
23 #end for | |
24 #set $infiles = $infiles[:-1] | |
25 | |
26 ln -s $__tool_directory__/scripts/S02_04_keep_one_hit_from_blast.py . && | |
27 ln -s $__tool_directory__/scripts/S03_run_second_blast.py . && | |
28 ln -s $__tool_directory__/scripts/S05_find_rbh.py . && | |
29 | |
30 python -W ignore $__tool_directory__/scripts/S01_run_first_blast.py $infiles ${e_value} $method | |
31 > ${output}; | |
32 ]]></command> | |
33 | |
34 <inputs> | |
35 <param name="inputs" type="data" format="fasta" multiple="true" label="Input fasta files" /> | |
36 <param name="method" type="select" label="Alignment tool to use" help="tblastx is slow and sensitive, diamond is a lot quicker and less sensitive"> | |
37 <option value="tblastx">tblastx</option> | |
38 <option value="diamond">Diamond</option> | |
39 </param> | |
40 <param name="e_value" type="float" value="1e-5" label="e_value" help="e-value for blast." /> | |
41 </inputs> | |
42 | |
43 <outputs> | |
44 <data format="txt" name="output" label="Pairwise" /> | |
45 <collection name="output_fasta_dna" type="list" label="Pairwise_DNA"> | |
46 <discover_datasets pattern="__name_and_ext__" directory="outputs_RBH_dna" /> | |
47 </collection> | |
48 </outputs> | |
49 | |
50 <tests> | |
51 <test> | |
52 <param name="inputs" ftype="fasta" value="inputs_tblastx/AcAcaud_trinity.fasta,inputs_tblastx/AmAmphi_trinity.fasta,inputs_tblastx/ApApomp_trinity.fasta,inputs_tblastx/PfPfiji_trinity.fasta" /> | |
53 <param name="e-value" value="1e-5" /> | |
54 <param name="method" value="tblastx" /> | |
55 <output_collection name="output_fasta_dna" type="list"> | |
56 <element name="RBH_AcAcaud_AmAmphi_dna"> | |
57 <assert_contents> | |
58 <has_text text=">Ac5_1/1_1.000_160"/> | |
59 <has_text text="GCACCGGGATGCGGATTTGCTGACGATATGGCAAAAGCATTGTCAGCGTGCGGAACCTGTTTATGTCACACCA"/> | |
60 <has_text text=">Am1_1/1_1.000_160"/> | |
61 <has_text text=">Ac7_1/1_1.000_160"/> | |
62 <has_text text="GCACCTAGAATTACCCGAAGTTGCTTGGCAATAGCGACACCTAACGGTCGCCATGATATTTGCAGGAAGAAGG"/> | |
63 <has_text text=">Am3_1/1_1.000_160"/> | |
64 <has_text text=">Ac6_1/1_1.000_160"/> | |
65 <has_text text="CAGCCTACCACTGAGAAGAGATACTTCAACATGTCTTACTGGGGTAGAAGTGGTGGTCGTACAGCGGGTGGTA"/> | |
66 <has_text text=">Am2_1/1_1.000_160"/> | |
67 </assert_contents> | |
68 </element> | |
69 <element name="RBH_AcAcaud_PfPfiji_dna"> | |
70 <assert_contents> | |
71 <has_text text=">Ac8_1/1_1.000_160"/> | |
72 <has_text text="ATCAAAGAAGAGCAACATCGAGCTACTGGCACTGGCAATGGAATCCTAATTATAGCAGAAACAAGCACTGGTTG"/> | |
73 <has_text text=">Pf8_1/1_1.000_160"/> | |
74 <has_text text=">Ac5_1/1_1.000_160"/> | |
75 <has_text text="GCACCGGGATGCGGATTTGCTGACGATATGGCAAAAGCATTGTCAGCGTGCGGAACCTGTTTATGTCACACCAC"/> | |
76 <has_text text=">Pf7_1/1_1.000_160"/> | |
77 </assert_contents> | |
78 </element> | |
79 <element name="RBH_ApApomp_PfPfiji_dna"> | |
80 <assert_contents> | |
81 <has_text text=">Ap2_1/1_1.000_160"/> | |
82 <has_text text="ATACTCAGGCACACAGCATTTGTCGTACTAGGCGAGAGAGAGAGAGGAACGACTAATTGCAACCACGATTA"/> | |
83 <has_text text=">Pf5_1/1_1.000_160"/> | |
84 <has_text text=">Ap1_1/1_1.000_160"/> | |
85 <has_text text="GGTCGCCTTATAAAAACCAATCCGAAACAGTTTTCCTTTGAAACGTGCCAAAAACCAAAAACATACTTCAA"/> | |
86 <has_text text=">Pf4_1/1_1.000_160"/> | |
87 <has_text text=">Ap4_1/1_1.000_135"/> | |
88 <has_text text="CGGCCGCGGCGCGTCGTTCTCAGCCAAGCTGACTTCGACTTGAGCCGTCCATTCGCTTATTTACACGACGA"/> | |
89 <has_text text=">Pf10_1/1_1.000_160"/> | |
90 <has_text text=">Ap3_1/1_1.000_160"/> | |
91 <has_text text="GCCATGCAGTACACTGGACTTCTGTTATTCTGTTTGTTTGCCTTGACGGCAGCCAAACCCGCGGAAGACCT"/> | |
92 <has_text text=">Pf6_1/1_1.000_160"/> | |
93 </assert_contents> | |
94 </element> | |
95 <element name="RBH_AmAmphi_PfPfiji_dna"> | |
96 <assert_contents> | |
97 <has_text text=">Am8_1/1_1.000_160"/> | |
98 <has_text text="GTATTAATAAAAGGACAAGACTATTATTTAATACCAAGAAATCTGGCCTTAATAAGCATGGTTGCTTATATCAT"/> | |
99 <has_text text=">Pf9_1/1_1.000_160"/> | |
100 <has_text text=">Am1_1/1_1.000_160"/> | |
101 <has_text text="GCACCGGGATGCGGATTTGCTGACGATATGGCAAAAGCATTGTCAGCGTGCGGAACCTGTTTATGTCACACCA"/> | |
102 <has_text text=">Pf7_1/1_1.000_160"/> | |
103 </assert_contents> | |
104 </element> | |
105 </output_collection> | |
106 </test> | |
107 | |
108 <test> | |
109 <param name="inputs" ftype="fasta" value="inputs_diamond/AcAcaud_Trinity.fasta,inputs_diamond/AmAmphi_Trinity.fasta,inputs_diamond/ApApomp_Trinity.fasta,inputs_diamond/PfPfiji_Trinity.fasta" /> | |
110 <param name="e-value" value="1e-5" /> | |
111 <param name="method" value="diamond" /> | |
112 <output_collection name="output_fasta_dna" type="list"> | |
113 <element name="RBH_AcAcaud_AmAmphi_dna"> | |
114 <assert_contents> | |
115 <has_text text=">Ac5_1/1_1.000_160"/> | |
116 <has_text text="GCACCGGGATGCGGATTTGCTGACGATATGGCAAAAGCATTGTCAGCGTGCGGAACCTGTTTATGTCACACCA"/> | |
117 <has_text text=">Am1_1/1_1.000_160"/> | |
118 <has_text text=">Ac7_1/1_1.000_160"/> | |
119 <has_text text="GCACCTAGAATTACCCGAAGTTGCTTGGCAATAGCGACACCTAACGGTCGCCATGATATTTGCAGGAAGAAGG"/> | |
120 <has_text text=">Am3_1/1_1.000_160"/> | |
121 <has_text text=">Ac6_1/1_1.000_160"/> | |
122 <has_text text="CAGCCTACCACTGAGAAGAGATACTTCAACATGTCTTACTGGGGTAGAAGTGGTGGTCGTACAGCGGGTGGTA"/> | |
123 <has_text text=">Am2_1/1_1.000_160"/> | |
124 </assert_contents> | |
125 </element> | |
126 <element name="RBH_AcAcaud_ApApomp_dna"> | |
127 <assert_contents> | |
128 <has_text text=">Ac23_1/1_1.000_366"/> | |
129 <has_text text="ACTGAGGCTCGAACACAACAAAAAGGTGATGAGCAGTCAGCACTTAATAGAATATTACAGCAAGTAGCCAGTAA"/> | |
130 <has_text text=">Ap46_1/1_1.000_217"/> | |
131 <has_text text="CCACAACCAAGTGGCGGGTATAACAGCACCGAGGCTCGAACACAGCAAAAAGGTGATGAGCAGTCAGCTCTTAA"/> | |
132 </assert_contents> | |
133 </element> | |
134 <element name="RBH_AcAcaud_PfPfiji_dna"> | |
135 <assert_contents> | |
136 <has_text text=">Ac8_1/1_1.000_160"/> | |
137 <has_text text="ATCAAAGAAGAGCAACATCGAGCTACTGGCACTGGCAATGGAATCCTAATTATAGCAGAAACAAGCACTGGTTG"/> | |
138 <has_text text=">Pf8_1/1_1.000_160"/> | |
139 <has_text text=">Ac5_1/1_1.000_160"/> | |
140 <has_text text="GCACCGGGATGCGGATTTGCTGACGATATGGCAAAAGCATTGTCAGCGTGCGGAACCTGTTTATGTCACACCAC"/> | |
141 <has_text text=">Pf7_1/1_1.000_160"/> | |
142 </assert_contents> | |
143 </element> | |
144 <element name="RBH_AmAmphi_PfPfiji_dna"> | |
145 <assert_contents> | |
146 <has_text text=">Am8_1/1_1.000_160"/> | |
147 <has_text text="GTATTAATAAAAGGACAAGACTATTATTTAATACCAAGAAATCTGGCCTTAATAAGCATGGTTGCTTATATCAT"/> | |
148 <has_text text=">Pf9_1/1_1.000_160"/> | |
149 <has_text text=">Am1_1/1_1.000_160"/> | |
150 <has_text text="GCACCGGGATGCGGATTTGCTGACGATATGGCAAAAGCATTGTCAGCGTGCGGAACCTGTTTATGTCACACCA"/> | |
151 <has_text text=">Pf7_1/1_1.000_160"/> | |
152 </assert_contents> | |
153 </element> | |
154 <element name="RBH_ApApomp_PfPfiji_dna"> | |
155 <assert_contents> | |
156 <has_text text=">Ap2_1/1_1.000_160"/> | |
157 <has_text text="ATACTCAGGCACACAGCATTTGTCGTACTAGGCGAGAGAGAGAGAGGAACGACTAATTGCAACCACGATTA"/> | |
158 <has_text text=">Pf5_1/1_1.000_160"/> | |
159 <!-- | |
160 <has_text text=">Ap1_1/1_1.000_160"/> | |
161 <has_text text="GGTCGCCTTATAAAAACCAATCCGAAACAGTTTTCCTTTGAAACGTGCCAAAAACCAAAAACATACTTCAA"/> | |
162 <has_text text=">Pf4_1/1_1.000_160"/> | |
163 <has_text text=">Ap4_1/1_1.000_160"/> | |
164 <has_text text="CGGCCGCGGCGCGTCGTTCTCAGCCAAGCTGACTTCGACTTGAGCCGTCCATTCGCTTATTTACACGACGA"/> | |
165 <has_text text=">Pf10_1/1_1.000_160"/> | |
166 <has_text text=">Ap3_1/1_1.000_160"/> | |
167 <has_text text="GCCATGCAGTACACTGGACTTCTGTTATTCTGTTTGTTTGCCTTGACGGCAGCCAAACCCGCGGAAGACCT"/> | |
168 <has_text text=">Pf6_1/1_1.000_160"/> | |
169 --> | |
170 </assert_contents> | |
171 </element> | |
172 </output_collection> | |
173 </test> | |
174 </tests> | |
175 | |
176 <help> | |
177 | |
178 @HELP_AUTHORS@ | |
179 | |
180 <![CDATA[ | |
181 | |
182 **Description** | |
183 | |
184 This tool searches for different homologous genes from pairwise comparisons between a set of fasta files (one file per species). | |
185 | |
186 -------- | |
187 | |
188 **Parameters** | |
189 | |
190 - 'Input files' : a collection of fasta files (one file per species) | |
191 - 'e_value' : the blast e-value. By default it's 1e-5. | |
192 - 'Alignment tool' : choose the sequences alignment tool between tblastx and Diamond. tblastx is more sensitive and Diamond is much faster. | |
193 | |
194 -------- | |
195 | |
196 **Outputs** | |
197 | |
198 - 'Pairwise' : the general output. It gives the information about what the tool has done for each pairwise. | |
199 | |
200 - 'Pairwise_DNA' : the output which contains nucleic sequences (of the pairwise) that are homologous. The sequences are in nucleic format. There are one file per couple of species, and homologous pairs are written by sets of 4 lines : | |
201 | |
202 Exemple for two homologous pairs for the output file for species X/Y : | |
203 | |
204 | >Gene_A_species_X_homologous_to_Gene_B_species_Y | |
205 | Nucleic_sequence_from_filter_assemblies | |
206 | >Gene_B_species_Y_homologous_to_Gene_A_species_X | |
207 | Nucleic_sequence_from_filter_assemblies | |
208 | >Gene_C_species_X_homologous_to_Gene_D_species_Y | |
209 | Nucleic_sequence_from_filter_assemblies | |
210 | >Gene_D_species_Y_homologous_to_Gene_C_species_X | |
211 | Nucleic_sequence_from_filter_assemblies | |
212 | |
213 | |
214 -------- | |
215 | |
216 **The AdaptSearch Pipeline** | |
217 | |
218 .. image:: adaptsearch_picture_helps.png | |
219 | |
220 --------- | |
221 | |
222 Changelog | |
223 --------- | |
224 | |
225 **Version 2.1 - 03/07/2018** | |
226 | |
227 - Add the possibility to use Diamond instead of tblastx | |
228 | |
229 **Version 2.0 - 18/04/2017** | |
230 | |
231 - NEW: Replace the zip between tools by Dataset Collection | |
232 | |
233 | |
234 **Version 1.0 - 13/04/2017** | |
235 | |
236 - TEST: Add functional test with planemo | |
237 | |
238 - IMPROVEMENT: Use conda dependencies for blast, samtools and python | |
239 | |
240 ]]> | |
241 </help> | |
242 | |
243 </tool> |