Mercurial > repos > iuc > humann_regroup_table
comparison humann_regroup_table.xml @ 0:26ce946f4da9 draft
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/humann commit 077b8f34e081e6c427acb0fde0fbb97d1b241e0b"
author | iuc |
---|---|
date | Wed, 12 May 2021 08:59:30 +0000 |
parents | |
children |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:26ce946f4da9 |
---|---|
1 <tool id="humann_regroup_table" name="Regroup" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="@PROFILE@"> | |
2 <description>HUMAnN table features</description> | |
3 <macros> | |
4 <import>macros.xml</import> | |
5 </macros> | |
6 <expand macro="edam_ontology"/> | |
7 <expand macro="requirements"/> | |
8 <expand macro="version"/> | |
9 <command detect_errors="exit_code"><![CDATA[ | |
10 humann_regroup_table | |
11 --input '$input' | |
12 --output '$output' | |
13 --function '$function' | |
14 #if $grouping.type == "standard" | |
15 --groups '$grouping.groups' | |
16 #else if $grouping.type == "large" | |
17 --custom '$grouping.grouping.fields.path' | |
18 $grouping.reversed | |
19 #else: | |
20 --custom '$grouping.custom' | |
21 $grouping.reversed | |
22 #end if | |
23 --precision $precision | |
24 --ungrouped '$ungrouped' | |
25 --protected '$protected' | |
26 ]]></command> | |
27 <inputs> | |
28 <param argument="--input" type="data" format="tsv,tabular" label="Gene families table"/> | |
29 <param argument="--function" type="select" label="How to combine grouped features?"> | |
30 <option value="sum" selected="true">Sum</option> | |
31 <option value="mean">Mean</option> | |
32 </param> | |
33 <conditional name="grouping"> | |
34 <param name="type" type="select" label="Grouping"> | |
35 <option value="standard">Basic grouping (to MetaCyc pathways)</option> | |
36 <option value="large">Grouping with larger mapping</option> | |
37 <option value="custom">Grouping with custom mapping</option> | |
38 </param> | |
39 <when value="standard"> | |
40 <param argument="--groups" type="select" label="Grouping"> | |
41 <option value="uniref90_rxn">UniRef90 to MetaCyc pathways</option> | |
42 <option value="uniref50_rxn">UniRef50 to MetaCyc pathways</option> | |
43 </param> | |
44 </when> | |
45 <when value="large"> | |
46 <param name="grouping" type="select" label="Mapping to use for the grouping"> | |
47 <options from_data_table="humann_utility_mapping"> | |
48 <validator message="No utility mapping is available" type="no_options" /> | |
49 <filter type="regexp" column="0" value=".*map.*(?!_name)" keep="true"/> | |
50 </options> | |
51 </param> | |
52 <param argument="--reversed" type="boolean" checked="false" truevalue="--reversed" falsevalue="" label="Mapping from features to groups?"/> | |
53 </when> | |
54 <when value="custom"> | |
55 <param argument="--custom" type="data" format="tsv,txt,tabular" label="Custom mapping file for grouping" help="The format is explained in the help"/> | |
56 <param argument="--reversed" type="boolean" checked="false" truevalue="--reversed" falsevalue="" label="Is the groups file reversed?" help="Mapping from features to groups"/> | |
57 </when> | |
58 </conditional> | |
59 <param argument="--precision" type="integer" value="3" label="Decimal places to round to after applying function"/> | |
60 <param argument="--ungrouped" type="boolean" checked="true" truevalue="Y" falsevalue="N" label="Include an 'UNGROUPED' group to capture features that did not belong to other groups?"/> | |
61 <param argument="--protected" type="boolean" checked="true" truevalue="Y" falsevalue="N" label="Carry through protected features, such as 'UNMAPPED'?"/> | |
62 </inputs> | |
63 <outputs> | |
64 <data name="output" format="tabular"/> | |
65 </outputs> | |
66 <tests> | |
67 <test expect_num_outputs="1"> | |
68 <param name="input" value="demo_genefamilies.tsv"/> | |
69 <param name="function" value="sum"/> | |
70 <conditional name="grouping"> | |
71 <param name="type" value="standard"/> | |
72 <param name="groups" value="uniref90_rxn"/> | |
73 </conditional> | |
74 <param name="precision" value="3"/> | |
75 <param name="ungrouped" value="Y"/> | |
76 <param name="protected" value="Y"/> | |
77 <output name="output" ftype="tabular"> | |
78 <assert_contents> | |
79 <has_text text="2.5.1.19-RXN|g__Bacteroides.s__Bacteroides_vulgatus"/> | |
80 <has_text text="ACETYLGLUTKIN-RXN|g__Bacteroides.s__Bacteroides_vulgatus"/> | |
81 </assert_contents> | |
82 </output> | |
83 </test> | |
84 <test expect_num_outputs="1"> | |
85 <param name="input" value="demo_genefamilies.tsv"/> | |
86 <param name="function" value="mean"/> | |
87 <conditional name="grouping"> | |
88 <param name="type" value="large"/> | |
89 <param name="grouping" value="utility_mapping-full-map_go_uniref90-3.0.0-29042021"/> | |
90 </conditional> | |
91 <param name="precision" value="3"/> | |
92 <param name="ungrouped" value="Y"/> | |
93 <param name="protected" value="Y"/> | |
94 <output name="output" ftype="tabular"> | |
95 <assert_contents> | |
96 <has_text text="GO:0000049|g__Bacteroides.s__Bacteroides_vulgatus" /> | |
97 <has_text text="GO:0003866|g__Bacteroides.s__Bacteroides_vulgatus" /> | |
98 </assert_contents> | |
99 </output> | |
100 </test> | |
101 <test expect_num_outputs="1"> | |
102 <param name="input" value="demo_genefamilies.tsv"/> | |
103 <param name="function" value="sum"/> | |
104 <conditional name="grouping"> | |
105 <param name="type" value="custom"/> | |
106 <!-- file generated using customizemapping file --> | |
107 <param name="custom" value="test-db/utility_mapping/map_go_uniref90.txt"/> | |
108 </conditional> | |
109 <param name="precision" value="3"/> | |
110 <param name="ungrouped" value="Y"/> | |
111 <param name="protected" value="Y"/> | |
112 <output name="output" ftype="tabular"> | |
113 <assert_contents> | |
114 <has_text text="GO:0000049|g__Bacteroides.s__Bacteroides_vulgatus" /> | |
115 <has_text text="GO:0003866|g__Bacteroides.s__Bacteroides_vulgatus" /> | |
116 </assert_contents> | |
117 </output> | |
118 </test> | |
119 </tests> | |
120 <help><![CDATA[ | |
121 @HELP_HEADER@ | |
122 | |
123 This tool takes a table of feature values and a mapping of groups to component features to produce | |
124 a new table with group values in place of feature values. | |
125 | |
126 HUMAnN gene family output can contain a very large number of features depending on the complexity | |
127 of your underlying sample. One way to explore this information in a simplified manner is via HUMAnN's | |
128 own pathway coverage and abundance, which summarize the values of their member genes. However, this | |
129 approach does not apply to gene families that are not associated with metabolic pathways. | |
130 | |
131 To further simplify the exploration of gene family abundance data, users can regroup gene families | |
132 into other functional categories using the current tool. This tool takes as arguments a gene | |
133 family abundance table and a mapping (groups) file that indicates which gene families belong to which | |
134 groups. | |
135 | |
136 Out of the box, HUMAnN can regroup gene families to MetaCyc reactions (a step which is also | |
137 used internally as part of MetaCyc pathway quantification). Users can use additional mapping files | |
138 for both UniRef90 and UniRef50 gene families to the following systems: | |
139 | |
140 - MetaCyc Reactions | |
141 - KEGG Orthogroups (KOs) | |
142 - Pfam domains | |
143 - Level-4 enzyme commission (EC) categories | |
144 - EggNOG (including COGs) | |
145 - Gene Ontology (GO) | |
146 - Informative GO | |
147 | |
148 In most cases, mappings are directly inferred from the annotation of the corresponding UniRef centroid sequence in UniProt. | |
149 | |
150 One exception to this are the "informative GO" (infogo1000) maps: These are informative subsets of GO computed from UniProt's | |
151 annotations and the structure of the GO hierarchy specifically for HUMAnN (each informative GO term has >1,000 UniRef centroids | |
152 annotated to it, but none of its progeny terms have >1,000 centroids so annotated). | |
153 | |
154 If the "UNMAPPED" gene abundance feature is included in a user's input, it will automatically be carried forward to the final output. | |
155 In addition, genes that do not group with a non-trivial feature are combined as an "UNGROUPED" group. By default, UNGROUPED reflects | |
156 the total abundance of genes that did not belong to another group (similar in spirit to the "UNINTEGRATED" value reported in the pathway | |
157 abundance file). | |
158 | |
159 | |
160 Some groups are not associated by default with human-readable names. To attach names to a regrouped table, use the HUMAnN rename tool | |
161 (The "GO" name map can be used for both raw GO and informative GO.) | |
162 | |
163 Inputs | |
164 ====== | |
165 | |
166 Users are free to create and use additional mapping files and pass them to this tool. The format of a mapping file is: | |
167 | |
168 `` | |
169 group1 uniref1 uniref2 uniref3 ... | |
170 `` | |
171 | |
172 `` | |
173 group2 uniref1 uniref5 ... | |
174 `` | |
175 | |
176 Where spaces between items above denote TABS. By default, feature abundances (such as gene families) are summed to produce group abundances. | |
177 | |
178 | |
179 | |
180 ]]></help> | |
181 <expand macro="citations"/> | |
182 </tool> |