comparison POGs.xml @ 0:7bee3426a442 draft default tip

planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 3c7982d775b6f3b472f6514d791edcb43cd258a1-dirty
author abims-sbr
date Fri, 01 Feb 2019 10:24:29 -0500
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:7bee3426a442
1 <tool name="POGs" id="POGs" version="2.0.1">
2
3 <description>
4 Find orthologous groups
5 </description>
6
7 <macros>
8 <import>macros.xml</import>
9 </macros>
10
11 <requirements>
12 <expand macro="python_required" />
13 <requirement type="package" version="0.20.0">pandas</requirement>
14 <requirement type="package" version="1.12.0">numpy</requirement>
15 </requirements>
16
17 <command>
18 <![CDATA[
19 #set $infiles_from_paiwise_dna = ""
20 #for $input_from_paiwise_dna in $inputs_from_paiwise_dna
21 ln -s '$input_from_paiwise_dna' '$input_from_paiwise_dna.element_identifier';
22 #set $infiles_from_paiwise_dna = $infiles_from_paiwise_dna + $input_from_paiwise_dna.element_identifier + ","
23 #end for
24 #set $infiles_from_paiwise_dna = $infiles_from_paiwise_dna[:-1]
25
26 python '$__tool_directory__/scripts/pogs.py' '$infiles_from_paiwise_dna' '$minspec'
27
28 #if $verbose=="T":
29 -v
30 #end if
31 #if $paralogs=="T":
32 -p
33 #end if
34
35 > ${log}
36
37 ]]>
38 </command>
39
40 <inputs>
41 <param name="inputs_from_paiwise_dna" type="data" format="fasta" multiple="true" label="Input files from Pairwise DNA" />
42 <param name="minspec" type="integer" value="3" label="Drop orthogroups with less than n species" />
43 <param name="verbose" type="boolean" checked="True" truevalue="T" falsevalue="F" label="Verbose" help="Display a summary table of orthogroups before paralogs filtering"/>
44 <param name="paralogs" type="boolean" checked="False" truevalue="T" falsevalue="F" label="Paralogs" help="Return also orthogroups without paralogs filtering"/>
45 </inputs>
46
47 <outputs>
48 <data format="txt" name="log" label="pogs.output" />
49 <collection name="output" type="list" label="POGs_unaligned">
50 <discover_datasets pattern="__name_and_ext__" directory="outputs" />
51 </collection>
52 <collection name="outputPara" type="list" label="POGs_withParalogs_unaligned">
53 <discover_datasets pattern="__name_and_ext__" directory="outputs_withParalogs" />
54 <filter>paralogs == True</filter>
55 </collection>
56 </outputs>
57
58 <tests>
59 <test>
60 <param name="inputs_from_paiwise_dna" ftype="fasta" value="output_pairwise/RBH_AmAmphi_AcAcaud.fasta,output_pairwise/RBH_ApApomp_AcAcaud.fasta,output_pairwise/RBH_ApApomp_AmAmphi.fasta,output_pairwise/RBH_TeTerlap_AcAcaud.fasta,output_pairwise/RBH_TeTerlap_AmAmphi.fasta,output_pairwise/RBH_TeTerlap_ApApomp.fasta"/>
61 <param name="minspec" value="3"/>
62 <param name="verbose" value="True"/>
63 <param name="paralogs" value="True"/>
64 <output name="log" value="pogs.output" />
65 <output_collection name="output" type="list">
66 <element name="orthogroup_1_with_4_sequences" value="outputs/orthogroup_1_with_4_sequences.fasta" />
67 <element name="orthogroup_2_with_4_sequences" value="outputs/orthogroup_2_with_4_sequences.fasta" />
68 <element name="orthogroup_3_with_3_sequences" value="outputs/orthogroup_3_with_3_sequences.fasta" />
69 <element name="orthogroup_4_with_4_sequences" value="outputs/orthogroup_4_with_4_sequences.fasta" />
70 <element name="orthogroup_5_with_3_sequences" value="outputs/orthogroup_5_with_3_sequences.fasta" />
71 <element name="orthogroup_6_with_4_sequences" value="outputs/orthogroup_6_with_4_sequences.fasta" />
72 <element name="orthogroup_7_with_3_sequences" value="outputs/orthogroup_7_with_3_sequences.fasta" />
73 <element name="orthogroup_8_with_3_sequences" value="outputs/orthogroup_8_with_3_sequences.fasta" />
74 <element name="orthogroup_9_with_3_sequences" value="outputs/orthogroup_9_with_3_sequences.fasta" />
75 <element name="orthogroup_10_with_3_sequences" value="outputs/orthogroup_10_with_3_sequences.fasta" />
76 </output_collection>
77 <output_collection name="outputPara" type="list">
78 <element name="orthogroup_1_with_13_sequences_withParalogs" value="outputs_withParalogs/orthogroup_1_with_13_sequences_withParalogs.fasta" />
79 <element name="orthogroup_2_with_7_sequences_withParalogs" value="outputs_withParalogs/orthogroup_2_with_7_sequences_withParalogs.fasta" />
80 <element name="orthogroup_3_with_3_sequences_withParalogs" value="outputs_withParalogs/orthogroup_3_with_3_sequences_withParalogs.fasta" />
81 <element name="orthogroup_4_with_7_sequences_withParalogs" value="outputs_withParalogs/orthogroup_4_with_7_sequences_withParalogs.fasta" />
82 <element name="orthogroup_5_with_3_sequences_withParalogs" value="outputs_withParalogs/orthogroup_5_with_3_sequences_withParalogs.fasta" />
83 <element name="orthogroup_6_with_4_sequences_withParalogs" value="outputs_withParalogs/orthogroup_6_with_4_sequences_withParalogs.fasta" />
84 <element name="orthogroup_7_with_3_sequences_withParalogs" value="outputs_withParalogs/orthogroup_7_with_3_sequences_withParalogs.fasta" />
85 <element name="orthogroup_8_with_5_sequences_withParalogs" value="outputs_withParalogs/orthogroup_8_with_5_sequences_withParalogs.fasta" />
86 <element name="orthogroup_9_with_3_sequences_withParalogs" value="outputs_withParalogs/orthogroup_9_with_3_sequences_withParalogs.fasta" />
87 <element name="orthogroup_10_with_4_sequences_withParalogs" value="outputs_withParalogs/orthogroup_10_with_4_sequences_withParalogs.fasta" />
88 </output_collection>
89 </test>
90 <test>
91 <param name="inputs_from_paiwise_dna" ftype="fasta" value="output_pairwise/RBH_AmAmphi_AcAcaud.fasta,output_pairwise/RBH_ApApomp_AcAcaud.fasta,output_pairwise/RBH_ApApomp_AmAmphi.fasta,output_pairwise/RBH_TeTerlap_AcAcaud.fasta,output_pairwise/RBH_TeTerlap_AmAmphi.fasta,output_pairwise/RBH_TeTerlap_ApApomp.fasta"/>
92 <param name="minspec" value="3"/>
93 <param name="verbose" value="True"/>
94 <param name="paralogs" value="False"/>
95 <output name="log" value="2_pogs.output" />
96 <output_collection name="output" type="list">
97 <element name="orthogroup_1_with_4_sequences" value="outputs/orthogroup_1_with_4_sequences.fasta" />
98 <element name="orthogroup_2_with_4_sequences" value="outputs/orthogroup_2_with_4_sequences.fasta" />
99 <element name="orthogroup_3_with_3_sequences" value="outputs/orthogroup_3_with_3_sequences.fasta" />
100 <element name="orthogroup_4_with_4_sequences" value="outputs/orthogroup_4_with_4_sequences.fasta" />
101 <element name="orthogroup_5_with_3_sequences" value="outputs/orthogroup_5_with_3_sequences.fasta" />
102 <element name="orthogroup_6_with_4_sequences" value="outputs/orthogroup_6_with_4_sequences.fasta" />
103 <element name="orthogroup_7_with_3_sequences" value="outputs/orthogroup_7_with_3_sequences.fasta" />
104 <element name="orthogroup_8_with_3_sequences" value="outputs/orthogroup_8_with_3_sequences.fasta" />
105 <element name="orthogroup_9_with_3_sequences" value="outputs/orthogroup_9_with_3_sequences.fasta" />
106 <element name="orthogroup_10_with_3_sequences" value="outputs/orthogroup_10_with_3_sequences.fasta" />
107 </output_collection>
108 </test>
109 </tests>
110
111 <help>
112
113 @HELP_AUTHORS@
114
115 <![CDATA[
116
117 **Description**
118
119 This tool parses homologous sequences obtained by pairwise and gather sequences into groups of orthologous sequences.
120
121 --------
122
123 **Inputs**
124
125 The output of the tool 'Pairwise' (pairwise_DNA, nucleic format) (AdaptSearch suite), which consists in lists of homologous sequences between pairs of species obtained by RBH comparisons.
126
127 --------
128
129 **Parameters**
130
131 - Species minimum : drop orthogroups with less than n species : orthogroups with less than n species within won't be recorded.
132 - verbose : check 'Yes' if you want a supplementary table : countings of orthogroups before the paralogous sequences removal.
133 - paralogs : check 'Yes' if you also want to retrieve the orthogroups before the paralogous sequences removal.
134
135
136 .. class:: warningmark
137
138 The minimum number of species per group only applies to the main output files. In the case of the 'paralogs' option, this parameter is more likely the minimum amount of sequences to keep.
139
140 --------
141
142 **Outputs**
143
144 This tool, produces the following files :
145
146 - POGs : the general output, displaying countings tables of orthogroups.
147
148 - POGs_unaligned : a dataset collection which contains the groups of orthologous sequences (one group per file) in nucleic format, with paralogous sequences removed (only one sequence is kept per species and per group)
149
150 - POGs_withParalogs_unaligned : a similar dataset colelction in where paralogous sequences are kept. This output is available if you check 'Yes' to the 'paralogous' option.
151
152 ---------
153
154 **The AdaptSearch Pipeline**
155
156 .. image:: adaptsearch_picture_helps.png
157
158 ---------
159
160 Changelog
161 ---------
162
163 **Version 2.1 - 04/01/2018**
164
165 - Rewritten with improved results and better code
166 - Added options verbose and paralogs
167
168 **Version 2.0 - 11/07/2017**
169
170 - Replace the zip between tools by Dataset Collection
171 - Add option : paralogs filtering
172 - Added a second functional test (to test the new option)
173 - Code factoring
174 - Removed zip format of input and output files ; replaced by dataset collections
175
176
177 **Version 1.0 - 13/04/2017**
178
179 - TEST: Add funtional test with planemo
180 - IMPROVEMENT: Use conda dependencies for python
181
182 ]]>
183
184 </help>
185
186 </tool>