comparison humann_regroup_table.xml @ 0:26ce946f4da9 draft

"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/humann commit 077b8f34e081e6c427acb0fde0fbb97d1b241e0b"
author iuc
date Wed, 12 May 2021 08:59:30 +0000
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:26ce946f4da9
1 <tool id="humann_regroup_table" name="Regroup" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="@PROFILE@">
2 <description>HUMAnN table features</description>
3 <macros>
4 <import>macros.xml</import>
5 </macros>
6 <expand macro="edam_ontology"/>
7 <expand macro="requirements"/>
8 <expand macro="version"/>
9 <command detect_errors="exit_code"><![CDATA[
10 humann_regroup_table
11 --input '$input'
12 --output '$output'
13 --function '$function'
14 #if $grouping.type == "standard"
15 --groups '$grouping.groups'
16 #else if $grouping.type == "large"
17 --custom '$grouping.grouping.fields.path'
18 $grouping.reversed
19 #else:
20 --custom '$grouping.custom'
21 $grouping.reversed
22 #end if
23 --precision $precision
24 --ungrouped '$ungrouped'
25 --protected '$protected'
26 ]]></command>
27 <inputs>
28 <param argument="--input" type="data" format="tsv,tabular" label="Gene families table"/>
29 <param argument="--function" type="select" label="How to combine grouped features?">
30 <option value="sum" selected="true">Sum</option>
31 <option value="mean">Mean</option>
32 </param>
33 <conditional name="grouping">
34 <param name="type" type="select" label="Grouping">
35 <option value="standard">Basic grouping (to MetaCyc pathways)</option>
36 <option value="large">Grouping with larger mapping</option>
37 <option value="custom">Grouping with custom mapping</option>
38 </param>
39 <when value="standard">
40 <param argument="--groups" type="select" label="Grouping">
41 <option value="uniref90_rxn">UniRef90 to MetaCyc pathways</option>
42 <option value="uniref50_rxn">UniRef50 to MetaCyc pathways</option>
43 </param>
44 </when>
45 <when value="large">
46 <param name="grouping" type="select" label="Mapping to use for the grouping">
47 <options from_data_table="humann_utility_mapping">
48 <validator message="No utility mapping is available" type="no_options" />
49 <filter type="regexp" column="0" value=".*map.*(?!_name)" keep="true"/>
50 </options>
51 </param>
52 <param argument="--reversed" type="boolean" checked="false" truevalue="--reversed" falsevalue="" label="Mapping from features to groups?"/>
53 </when>
54 <when value="custom">
55 <param argument="--custom" type="data" format="tsv,txt,tabular" label="Custom mapping file for grouping" help="The format is explained in the help"/>
56 <param argument="--reversed" type="boolean" checked="false" truevalue="--reversed" falsevalue="" label="Is the groups file reversed?" help="Mapping from features to groups"/>
57 </when>
58 </conditional>
59 <param argument="--precision" type="integer" value="3" label="Decimal places to round to after applying function"/>
60 <param argument="--ungrouped" type="boolean" checked="true" truevalue="Y" falsevalue="N" label="Include an 'UNGROUPED' group to capture features that did not belong to other groups?"/>
61 <param argument="--protected" type="boolean" checked="true" truevalue="Y" falsevalue="N" label="Carry through protected features, such as 'UNMAPPED'?"/>
62 </inputs>
63 <outputs>
64 <data name="output" format="tabular"/>
65 </outputs>
66 <tests>
67 <test expect_num_outputs="1">
68 <param name="input" value="demo_genefamilies.tsv"/>
69 <param name="function" value="sum"/>
70 <conditional name="grouping">
71 <param name="type" value="standard"/>
72 <param name="groups" value="uniref90_rxn"/>
73 </conditional>
74 <param name="precision" value="3"/>
75 <param name="ungrouped" value="Y"/>
76 <param name="protected" value="Y"/>
77 <output name="output" ftype="tabular">
78 <assert_contents>
79 <has_text text="2.5.1.19-RXN|g__Bacteroides.s__Bacteroides_vulgatus"/>
80 <has_text text="ACETYLGLUTKIN-RXN|g__Bacteroides.s__Bacteroides_vulgatus"/>
81 </assert_contents>
82 </output>
83 </test>
84 <test expect_num_outputs="1">
85 <param name="input" value="demo_genefamilies.tsv"/>
86 <param name="function" value="mean"/>
87 <conditional name="grouping">
88 <param name="type" value="large"/>
89 <param name="grouping" value="utility_mapping-full-map_go_uniref90-3.0.0-29042021"/>
90 </conditional>
91 <param name="precision" value="3"/>
92 <param name="ungrouped" value="Y"/>
93 <param name="protected" value="Y"/>
94 <output name="output" ftype="tabular">
95 <assert_contents>
96 <has_text text="GO:0000049|g__Bacteroides.s__Bacteroides_vulgatus" />
97 <has_text text="GO:0003866|g__Bacteroides.s__Bacteroides_vulgatus" />
98 </assert_contents>
99 </output>
100 </test>
101 <test expect_num_outputs="1">
102 <param name="input" value="demo_genefamilies.tsv"/>
103 <param name="function" value="sum"/>
104 <conditional name="grouping">
105 <param name="type" value="custom"/>
106 <!-- file generated using customizemapping file -->
107 <param name="custom" value="test-db/utility_mapping/map_go_uniref90.txt"/>
108 </conditional>
109 <param name="precision" value="3"/>
110 <param name="ungrouped" value="Y"/>
111 <param name="protected" value="Y"/>
112 <output name="output" ftype="tabular">
113 <assert_contents>
114 <has_text text="GO:0000049|g__Bacteroides.s__Bacteroides_vulgatus" />
115 <has_text text="GO:0003866|g__Bacteroides.s__Bacteroides_vulgatus" />
116 </assert_contents>
117 </output>
118 </test>
119 </tests>
120 <help><![CDATA[
121 @HELP_HEADER@
122
123 This tool takes a table of feature values and a mapping of groups to component features to produce
124 a new table with group values in place of feature values.
125
126 HUMAnN gene family output can contain a very large number of features depending on the complexity
127 of your underlying sample. One way to explore this information in a simplified manner is via HUMAnN's
128 own pathway coverage and abundance, which summarize the values of their member genes. However, this
129 approach does not apply to gene families that are not associated with metabolic pathways.
130
131 To further simplify the exploration of gene family abundance data, users can regroup gene families
132 into other functional categories using the current tool. This tool takes as arguments a gene
133 family abundance table and a mapping (groups) file that indicates which gene families belong to which
134 groups.
135
136 Out of the box, HUMAnN can regroup gene families to MetaCyc reactions (a step which is also
137 used internally as part of MetaCyc pathway quantification). Users can use additional mapping files
138 for both UniRef90 and UniRef50 gene families to the following systems:
139
140 - MetaCyc Reactions
141 - KEGG Orthogroups (KOs)
142 - Pfam domains
143 - Level-4 enzyme commission (EC) categories
144 - EggNOG (including COGs)
145 - Gene Ontology (GO)
146 - Informative GO
147
148 In most cases, mappings are directly inferred from the annotation of the corresponding UniRef centroid sequence in UniProt.
149
150 One exception to this are the "informative GO" (infogo1000) maps: These are informative subsets of GO computed from UniProt's
151 annotations and the structure of the GO hierarchy specifically for HUMAnN (each informative GO term has >1,000 UniRef centroids
152 annotated to it, but none of its progeny terms have >1,000 centroids so annotated).
153
154 If the "UNMAPPED" gene abundance feature is included in a user's input, it will automatically be carried forward to the final output.
155 In addition, genes that do not group with a non-trivial feature are combined as an "UNGROUPED" group. By default, UNGROUPED reflects
156 the total abundance of genes that did not belong to another group (similar in spirit to the "UNINTEGRATED" value reported in the pathway
157 abundance file).
158
159
160 Some groups are not associated by default with human-readable names. To attach names to a regrouped table, use the HUMAnN rename tool
161 (The "GO" name map can be used for both raw GO and informative GO.)
162
163 Inputs
164 ======
165
166 Users are free to create and use additional mapping files and pass them to this tool. The format of a mapping file is:
167
168 ``
169 group1 uniref1 uniref2 uniref3 ...
170 ``
171
172 ``
173 group2 uniref1 uniref5 ...
174 ``
175
176 Where spaces between items above denote TABS. By default, feature abundances (such as gene families) are summed to produce group abundances.
177
178
179
180 ]]></help>
181 <expand macro="citations"/>
182 </tool>