comparison tree_qa.xml @ 0:dd51f61c2309 draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/checkm commit 2a3b068a98bf0e913dc03e0d5c2182cfd102cf27
author iuc
date Fri, 29 Jul 2022 20:30:47 +0000
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:dd51f61c2309
1 <tool id="checkm_tree_qa" name="CheckM tree_qa" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="@PROFILE@">
2 <description>
3 Assess phylogenetic markers in the genome tree
4 </description>
5 <macros>
6 <import>macros.xml</import>
7 <xml name="concatenated_tre"> <!-- Tree input shared by the out_format 1-4 branches of the "output" conditional -->
8 <param name="concatenated_tre" type="data" format="phyloxml" label="Concatenated tree"/>
9 </xml>
10 </macros>
11 <expand macro="biotools"/>
12 <expand macro="requirements"/>
13 <expand macro="version"/>
14 <!-- Stages the alignment (out_format 5) or the tree (any other out_format) under inputs/storage/tree/, then runs checkm tree_qa on the 'inputs' directory and writes to 'output_file'. --> <command detect_errors="exit_code"><![CDATA[
15 @HMM_MARKER_STATS_INPUTS@
16 mkdir 'inputs/storage/tree/' &&
17 #if $output.out_format == '5'
18 ln -s '$output.concatenated_fasta' 'inputs/storage/tree/concatenated.fasta' &&
19 #else
20 ln -s '$output.concatenated_tre' 'inputs/storage/tree/concatenated.tre' &&
21 #end if
22
23 checkm tree_qa
24 'inputs'
25 --out_format $output.out_format
26 --tab_table
27 --file 'output_file'
28 ]]></command>
29 <inputs>
30 <expand macro="hmm_marker_stats_inputs"/>
31 <conditional name="output"> <!-- The selected out_format decides which extra dataset is requested: the concatenated tree (1-4) or the concatenated alignment (5) -->
32 <param argument="--out_format" type="select" label="Desired output">
33 <option value="1">Brief summary of genome tree placement</option>
34 <option value="2">Detailed summary of genome tree placement including lineage-specific statistics</option>
35 <option value="3">Genome tree in Newick format decorated with IMG genome ids</option>
36 <option value="4">Genome tree in Newick format decorated with taxonomy strings</option>
37 <option value="5">Multiple sequence alignment of reference genomes and bins</option>
38 </param>
39 <when value="1">
40 <expand macro="concatenated_tre"/>
41 </when>
42 <when value="2">
43 <expand macro="concatenated_tre"/>
44 </when>
45 <when value="3">
46 <expand macro="concatenated_tre"/>
47 </when>
48 <when value="4">
49 <expand macro="concatenated_tre"/>
50 </when>
51 <when value="5">
52 <param name="concatenated_fasta" type="data" format="fasta" label="Concatenated masked sequences"/> <!-- Staged as concatenated.fasta by the command and supplied as ftype="fasta" in the test, so the accepted datatype is fasta rather than phyloxml -->
53 </when>
54 </conditional>
55 </inputs>
56 <outputs> <!-- One candidate dataset per out_format value; all of them are collected from the same work-dir file "output_file" and each is gated by a filter on the selected out_format -->
57 <data name="output_f1" from_work_dir="output_file" format="tabular" label="${tool.name} on ${on_string}: Summary of genome tree placement">
58 <filter>output['out_format'] == "1"</filter>
59 </data>
60 <data name="output_f2" from_work_dir="output_file" format="tabular" label="${tool.name} on ${on_string}: Summary of genome tree placement including lineage-specific statistics">
61 <filter>output['out_format'] == "2"</filter>
62 </data>
63 <data name="output_f3" from_work_dir="output_file" format="newick" label="${tool.name} on ${on_string}: Genome tree decorated with IMG genome ids">
64 <filter>output['out_format'] == "3"</filter>
65 </data>
66 <data name="output_f4" from_work_dir="output_file" format="newick" label="${tool.name} on ${on_string}: Genome tree decorated with taxonomy strings">
67 <filter>output['out_format'] == "4"</filter>
68 </data>
69 <data name="output_f5" from_work_dir="output_file" format="tabular" label="${tool.name} on ${on_string}: Multiple sequence alignment of reference genomes and bins"> <!-- NOTE(review): the matching test asserts FASTA-like content; confirm whether "tabular" is the intended datatype -->
70 <filter>output['out_format'] == "5"</filter>
71 </data>
72 </outputs>
73 <tests>
74 <test expect_num_outputs="1"> <!-- out_format 1 (brief summary): checks the tabular output for the bin id, a taxonomy string and the text "# unique markers" -->
75 <param name="phylo_hmm_info" ftype="zip" value="phylo_hmm_info.pkl.gz"/>
76 <param name="bin_stats_tree" ftype="tabular" value="bin_stats.tree.tsv"/>
77 <param name="hmmer_tree">
78 <collection type="list">
79 <element name="637000110" ftype="txt" value="hmmer.tree.txt"/>
80 </collection>
81 </param>
82 <conditional name="output">
83 <param name="out_format" value="1"/>
84 <param name="concatenated_tre" ftype="phyloxml" value="concatenated.tre"/>
85 </conditional>
86 <output name="output_f1" ftype="tabular">
87 <assert_contents>
88 <has_text text="637000110"/>
89 <has_text text="k__Bacteria;p__Proteobacteria;c__Gammaproteobacteria"/>
90 <has_text text="# unique markers"/>
91 </assert_contents>
92 </output>
93 </test>
94 <test expect_num_outputs="1"> <!-- out_format 2 (detailed summary): same inputs as the out_format 1 test; checks for the bin id, the text "# unique markers (of 43)" and the text "UID5220" -->
95 <param name="phylo_hmm_info" ftype="zip" value="phylo_hmm_info.pkl.gz"/>
96 <param name="bin_stats_tree" ftype="tabular" value="bin_stats.tree.tsv"/>
97 <param name="hmmer_tree">
98 <collection type="list">
99 <element name="637000110" ftype="txt" value="hmmer.tree.txt"/>
100 </collection>
101 </param>
102 <conditional name="output">
103 <param name="out_format" value="2"/>
104 <param name="concatenated_tre" ftype="phyloxml" value="concatenated.tre"/>
105 </conditional>
106 <output name="output_f2" ftype="tabular">
107 <assert_contents>
108 <has_text text="637000110"/>
109 <has_text text="# unique markers (of 43)"/>
110 <has_text text="UID5220"/>
111 </assert_contents>
112 </output>
113 </test>
114 <test expect_num_outputs="1"> <!-- out_format 3 (Newick tree decorated with IMG genome ids): checks the newick output for an IMG id and two family-level labels -->
115 <param name="phylo_hmm_info" ftype="zip" value="phylo_hmm_info.pkl.gz"/>
116 <param name="bin_stats_tree" ftype="tabular" value="bin_stats.tree.tsv"/>
117 <param name="hmmer_tree">
118 <collection type="list">
119 <element name="IMG_646564547" ftype="txt" value="hmmer.tree.txt"/> <!-- NOTE(review): the other tests name this element 637000110; confirm the different identifier here is intentional -->
120 </collection>
121 </param>
122 <conditional name="output">
123 <param name="out_format" value="3"/>
124 <param name="concatenated_tre" ftype="phyloxml" value="concatenated.tre"/>
125 </conditional>
126 <output name="output_f3" ftype="newick">
127 <assert_contents>
128 <has_text text="IMG_646564547"/>
129 <has_text text="UID7|f__Methanocaldococcaceae"/>
130 <has_text text="f__Archaeoglobaceae"/>
131 </assert_contents>
132 </output>
133 </test>
134 <test expect_num_outputs="1"> <!-- out_format 4 (Newick tree decorated with taxonomy strings): checks the newick output for an IMG id and a kingdom/phylum taxonomy prefix -->
135 <param name="phylo_hmm_info" ftype="zip" value="phylo_hmm_info.pkl.gz"/>
136 <param name="bin_stats_tree" ftype="tabular" value="bin_stats.tree.tsv"/>
137 <param name="hmmer_tree">
138 <collection type="list">
139 <element name="637000110" ftype="txt" value="hmmer.tree.txt"/>
140 </collection>
141 </param>
142 <conditional name="output">
143 <param name="out_format" value="4"/>
144 <param name="concatenated_tre" ftype="phyloxml" value="concatenated.tre"/>
145 </conditional>
146 <output name="output_f4" ftype="newick">
147 <assert_contents>
148 <has_text text="IMG_646564547"/>
149 <has_text text="k__Archaea;p__Euryarchaeota"/>
150 </assert_contents>
151 </output>
152 </test>
153 <test expect_num_outputs="1"> <!-- out_format 5 (multiple sequence alignment): supplies concatenated_fasta instead of concatenated_tre and checks for a ">637000110" record and a sequence fragment -->
154 <param name="phylo_hmm_info" ftype="zip" value="phylo_hmm_info.pkl.gz"/>
155 <param name="bin_stats_tree" ftype="tabular" value="bin_stats.tree.tsv"/>
156 <param name="hmmer_tree">
157 <collection type="list">
158 <element name="637000110" ftype="txt" value="hmmer.tree.txt"/>
159 </collection>
160 </param>
161 <conditional name="output">
162 <param name="out_format" value="5"/>
163 <param name="concatenated_fasta" ftype="fasta" value="concatenated.fasta"/>
164 </conditional>
165 <output name="output_f5" ftype="tabular"> <!-- NOTE(review): the asserted content looks like FASTA while the expected ftype is tabular; confirm against the output_f5 declaration -->
166 <assert_contents>
167 <has_text text=">637000110"/>
168 <has_text text="-TVNQLVR"/>
169 </assert_contents>
170 </output>
171 </test>
172 </tests>
173 <help><![CDATA[
174 @HELP_HEADER@
175
176 This command assesses phylogenetic markers in the genome tree
177
178 Inputs
179 ======
180
181
182 Outputs
183 =======
184
185 The output depends on the selected output format:
186
187 1. brief summary of genome tree placement indicating the number of unique phylogenetically informative markers found, the number of markers found multiple times, and a taxon string indicating the placement of each bin within the genome tree
188 2. detailed summary of genome tree placement giving a more detailed indication of where each bin is within the genome tree, general characteristics about each bin (e.g., GC, genome size, coding density), and general characteristics about all reference genomes descendant from the parental node of each bin (e.g., mean and standard deviation of GC)
189 3. genome tree in Newick format decorated with IMG genome ids which can be used to examine the phylogenetic neighbours of each bin
190 4. genome tree in Newick format decorated with taxonomy strings which can be used to examine the phylogenetic neighbours of each bin
191 5. multiple sequence alignment of reference genomes and bins which can be used to infer a de novo genome tree
192
193
194 ]]></help>
195 <expand macro="citations"/>
196 </tool>