comparison data_manager/dada2_fetcher.xml @ 8:0181efacb40a draft default tip

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/main/data_managers/data_manager_dada2 commit 5f2ed0407e3adaafc6070fc0594a4685ade094db
author iuc
date Sat, 22 Nov 2025 20:07:44 +0000
parents 678176bff643
children
comparison
equal deleted inserted replaced
7:678176bff643 8:0181efacb40a
1 <?xml version="1.0"?> 1 <tool id="dada2_fetcher" name="dada2 data manager" tool_type="manage_data" version="0.1.2" profile="24.2">
2 <tool id="dada2_fetcher" name="dada2 data manager" tool_type="manage_data" version="0.1.1" profile="23.0">
3 <description>Download reference databases</description> 2 <description>Download reference databases</description>
4 <requirements> 3 <requirements>
5 <requirement type="package" version="3.7">python</requirement> 4 <requirement type="package" version="1.25.0">wget</requirement>
5 <requirement type="package" version="6.0">unzip</requirement>
6 </requirements> 6 </requirements>
7 <command detect_errors="exit_code"><![CDATA[ 7 <command detect_errors="exit_code"><![CDATA[
8 python '$__tool_directory__/data_manager.py' 8 ## see https://github.com/benjjneb/dada2/issues/2053 for the distinction of the _toGenus and _toSpecies datasets
9 --out '$out_file' 9 #set $FILE2TAXURL = {
10 #set dataset = str($db_cond.db_select) + '_' + str($db_cond.version_select) 10 "silva_138.2_toGenus": "https://zenodo.org/records/14169026/files/silva_nr99_v138.2_toGenus_trainset.fa.gz?download=1",
11 --dataset '$dataset' 11 "silva_138.2_toSpecies": "https://zenodo.org/records/14169026/files/silva_nr99_v138.2_toSpecies_trainset.fa.gz?download=1",
12
13 "silva_138.2_fungi_18S_toGenus": "https://zenodo.org/records/15044434/files/SILVA_SSUfungi_nr99_v138_2_toGenus_trainset.fasta?download=1",
14 "silva_138.2_fungi_18S_toSpecies": "https://zenodo.org/records/15044434/files/SILVA_SSUfungi_nr99_v138_2_toSpecies_trainset.fasta?download=1",
15
16 "silva_138.2_fungi_26S_toGenus": "https://zenodo.org/records/15044501/files/SILVA_LSUfungi_nr99_v138_2_toGenus_trainset.fasta?download=1",
17 "silva_138.2_fungi_26S_toSpecies": "https://zenodo.org/records/15044501/files/SILVA_LSUfungi_nr99_v138_2_toSpecies_trainset.fasta?download=1",
18
19 "silva_138": "https://zenodo.org/record/3731176/files/silva_nr_v138_train_set.fa.gz?download=1",
20 "silva_132": "https://zenodo.org/record/1172783/files/silva_nr_v132_train_set.fa.gz?download=1",
21 "silva_128": "https://zenodo.org/record/824551/files/silva_nr_v128_train_set.fa.gz?download=1",
22 "rdp_19_toGenus": "https://zenodo.org/records/14168771/files/rdp_19_toGenus_trainset.fa.gz?download=1",
23 "rdp_19_toSpecies": "https://zenodo.org/records/14168771/files/rdp_19_toSpecies_trainset.fa.gz?download=1",
24 "rdp_16": "https://zenodo.org/record/801828/files/rdp_train_set_16.fa.gz?download=1",
25 "rdp_14": "https://zenodo.org/record/158955/files/rdp_train_set_14.fa.gz?download=1",
26 "unite_8.0_fungi": "https://s3.hpc.ut.ee/plutof-public/original/9f7b41c3-825b-4db8-9c52-74a4603a860a.zip",
27 "unite_8.0_fungi_singletons": "https://s3.hpc.ut.ee/plutof-public/original/53dfc9ce-9cb5-4205-84bb-f47faff26462.zip",
28 "greengenes_13.84": "https://zenodo.org/record/158955/files/gg_13_8_train_set_97.fa.gz?download=1",
29 "greengenes2_2024.09_toGenus": "https://zenodo.org/records/14169078/files/gg2_2024_09_toGenus_trainset.fa.gz?download=1",
30 "greengenes2_2024.09_toSpecies": "https://zenodo.org/records/14169078/files/gg2_2024_09_toSpecies_trainset.fa.gz?download=1",
31 "RefSeq_RDP_2018_05": "https://zenodo.org/record/2541239/files/RefSeq-RDP16S_v2_May2018.fa.gz?download=1",
32
33 "gtdb_202_toGenus": "https://zenodo.org/records/4735821/files/GTDB_bac120_arc122_ssu_r202_Genus.fa.gz?download=1",
34 "gtdb_202_toSpecies": "https://zenodo.org/records/4735821/files/GTDB_bac120_arc122_ssu_r202_Species.fa.gz?download=1",
35 "gtdb_2018_11": "https://zenodo.org/record/2541239/files/GTDB_bac-arc_ssu_r86.fa.gz?download=1",
36
37 "hitdb_1": "https://zenodo.org/record/159205/files/hitdb_v1.00.fa.gz?download=1",
38 "silva_euk_18S_132": "https://zenodo.org/record/1447330/files/silva_132.18s.99_rep_set.dada2.fa.gz?download=1",
39 "PR2_4.11.1": "https://github.com/pr2database/pr2database/releases/download/4.11.1/pr2_version_4.11.1_dada2.fasta.gz"
40 }
41 ## rdp_19 not available for assignSpecies https://github.com/benjjneb/dada2/issues/2053#issuecomment-2512185929
42 #set FILE2SPECIESURL = {
43 "silva_138.2": "https://zenodo.org/records/14169026/files/silva_v138.2_assignSpecies.fa.gz?download=1",
44 "silva_138.2_fungi_18S": "https://zenodo.org/records/15044434/files/SILVA_SSUfungi_assignSpecies.fasta?download=1",
45 "silva_138.2_fungi_26S": "https://zenodo.org/records/15044501/files/SILVA_LSUfungi_assignSpecies.fasta?download=1",
46 "silva_138": "https://zenodo.org/record/3731176/files/silva_species_assignment_v138.fa.gz?download=1",
47 "silva_132": "https://zenodo.org/record/1172783/files/silva_species_assignment_v132.fa.gz?download=1",
48 "silva_128": "https://zenodo.org/record/824551/files/silva_species_assignment_v128.fa.gz?download=1",
49 "rdp_16": "https://zenodo.org/record/801828/files/rdp_species_assignment_16.fa.gz?download=1",
50 "rdp_14": "https://zenodo.org/record/158955/files/rdp_species_assignment_14.fa.gz?download=1",
51 "gtdb_202": "https://zenodo.org/records/4735821/files/GTDB_bac120_arc122_ssu_r202_fullTaxo.fa.gz?download=1",
52 "gtdb_2018_11": "https://zenodo.org/records/2658728/files/GTDB_dada2_assignment_species.fa.gz?download=1"
53 }
54 mkdir -p '${out_file.extra_files_path}' &&
55 cd '${out_file.extra_files_path}' &&
56 #for $database in $taxonomy_databases:
57 wget '$FILE2TAXURL[str($database)]' -O '${database}.taxonomy' &&
58 #if str($database).startswith("unite")
59 unzip -p '${database}.taxonomy' "*.fasta" -x "developer/*" > tmp &&
60 mv tmp '${database}.taxonomy' &&
61 #end if
62 #end for
63 #if $species_databases
64 #for $database in $species_databases:
65 wget '$FILE2SPECIESURL[str($database)]' -O '${database}.species' &&
66 #end for
67 #end if
68 cp '$dmjson' '$out_file'
12 ]]> 69 ]]>
13 </command> 70 </command>
71 <configfiles>
72 <configfile name="dmjson"><![CDATA[#slurp
73 #set FILE2NAME = {
74 "silva_138.2_toGenus": "Silva version 138.2 to Genus (for short reads)",
75 "silva_138.2_toSpecies": "Silva version 138.2 to Species (for long reads)",
76 "silva_138.2": "Silva version 138.2",
77
78 "silva_138.2_fungi_18S_toGenus": "Silva version 138.2 for Fungi 18S to Genus (for short reads)",
79 "silva_138.2_fungi_18S_toSpecies": "Silva version 138.2 for Fungi 18S to Species (for long reads)",
80 "silva_138.2_fungi_18S": "Silva version 138.2 for Fungi 18S",
81
82 "silva_138.2_fungi_26S_toGenus": "Silva version 138.2 for Fungi 26S to Genus (for short reads)",
83 "silva_138.2_fungi_26S_toSpecies": "Silva version 138.2 for Fungi 26S to Species (for long reads)",
84 "silva_138.2_fungi_26S": "Silva version 138.2 for Fungi 26S",
85
86 "silva_138": "Silva version 138",
87 "silva_132": "Silva version 132",
88 "silva_128": "Silva version 128",
89 "rdp_19_toGenus": "RDP trainset 19 to Genus (for short reads)",
90 "rdp_19_toSpecies": "RDP trainset 19 to Species (for long reads)",
91 "rdp_16": "RDP trainset 16",
92 "rdp_14": "RDP trainset 14",
93 "greengenes_13.84": "GreenGenes version 13.84",
94 "greengenes2_2024.09_toGenus": "GreenGenes2 release 2024.09 to Genus (for short reads)",
95 "greengenes2_2024.09_toSpecies": "GreenGenes2 release 2024.09 to Species (for long reads)",
96 "unite_8.0_fungi": "UNITE: General Fasta release 8.0 for Fungi",
97 "unite_8.0_fungi_singletons": "UNITE: General Fasta release 8.0 for Fungi including global and 97% singletons",
98 "RefSeq_RDP_2018_05": "NCBI RefSeq 16S rRNA database supplemented by RDP (05/2018)",
99
100 "gtdb_202_toGenus": "GTDB Version 202 to Genus (for short reads)",
101 "gtdb_202_toSpecies": "GTDB Version 202 to Species (for long reads)",
102 "gtdb_202": "GTDB Version 202",
103
104 "gtdb_2018_11": "GTDB: Genome Taxonomy Database (Bacteria & Archaea) (11/2018)",
105 "hitdb_1": "HitDB version 1 (Human InTestinal 16S rRNA)",
106 "silva_euk_18S_132": "Silva version 132 Eukaryotic 18S",
107 "PR2_4.11.1": "Protist Ribosomal Reference database (PR2) 4.11.1"
108 }
109 #set FILE2TAXLEVELS = {
110 "PR2_4.11.1": "Kingdom,Supergroup,Division,Class,Order,Family,Genus,Species",
111 }
112 {
113 "data_tables":{
114 "dada2_taxonomy": [
115 #for $i, $database in enumerate($taxonomy_databases):
116 #set taxlevels = FILE2TAXLEVELS.get(str($database), "Kingdom,Phylum,Class,Order,Family,Genus,Species")
117 {
118 "value": "$database",
119 "name": "$FILE2NAME[str($database)]",
120 "path": "${database}.taxonomy",
121 "taxlevels": "$taxlevels"
122 }#slurp
123 #if i + 1 < len(str($taxonomy_databases).split(","))
124 ,
125 #end if
126 #end for
127 ]
128 #if $species_databases
129 , "dada2_species": [
130 #for $i, $database in enumerate($species_databases):
131 {
132 "value": "$database",
133 "name": "$FILE2NAME[str($database)]",
134 "path": "${database}.species"
135 }#slurp
136 #if i + 1 < len(str($species_databases).split(","))
137 ,
138 #end if
139 #end for
140 ]
141 #end if
142 }
143 }
144 ]]></configfile>
145 </configfiles>
14 <inputs> 146 <inputs>
15 <conditional name="db_cond"> 147 <param name="taxonomy_databases" multiple="true" type="select" label="Taxonomic database" help="for assignTaxonomy">
16 <param name="db_select" type="select" label="Taxonomic database"> 148 <option value="silva_138.2_toGenus">Silva 138.2 to Genus (for short reads)</option>
17 <option value="silva">Silva</option> 149 <option value="silva_138.2_toSpecies">Silva 138.2 to Species (for long reads)</option>
18 <option value="rdp">RDP</option> 150
19 <option value="greengenes">GreenGenes</option> 151 <option value="silva_138.2_fungi_18S_toGenus">Silva 138.2 for Fungi 18S to Genus (for short reads)</option>
20 <option value="unite">UNITE Fungi: General Fasta</option> 152 <option value="silva_138.2_fungi_18S_toSpecies">Silva 138.2 for Fungi 18S to Species (for long read)</option>
21 <!-- UNITE Eukaryotes not yet supported https://github.com/benjjneb/dada2/issues/702 --> 153
22 <option value="RefSeq_RDP">NCBI RefSeq 16S rRNA database supplemented by RDP</option> 154 <option value="silva_138.2_fungi_26S_toGenus">Silva 138.2 for Fungi 26S to Genus (for short reads)</option>
23 <option value="gtdb">GTDB: Genome Taxonomy Database (Bacteria &amp; Archaea)</option> 155 <option value="silva_138.2_fungi_26S_toSpecies">Silva 138.2 for Fungi 26S to Species (for long reads)</option>
24 <option value="hitdb">HitDB (Human InTestinal 16S)</option> 156
25 <option value="silva_euk_18S">Silva Eukaryotic 18S</option> 157 <option value="silva_138">Silva 138</option>
26 <option value="PR2">Protist Ribosomal Reference database (PR2)</option> 158 <option value="silva_132">Silva 132</option>
27 </param> 159 <option value="silva_128">Silva 128</option>
28 <when value="silva"> 160 <option value="rdp_19_toGenus">RDP 19 to Genus (for short reads)</option>
29 <param name="version_select" type="select" label="Database version"> 161 <option value="rdp_19_toSpecies">RDP 19 to Species (for long reads)</option>
30 <option value="138">138</option> 162 <option value="rdp_16">RDP 16</option>
31 <option value="132">132</option> 163 <option value="rdp_14">RDP 14</option>
32 <option value="128">128</option> 164 <option value="greengenes2_2024.09_toGenus">GreenGenes2 2024.09 to Genus (for short reads)</option>
33 </param> 165 <option value="greengenes2_2024.09_toSpecies">GreenGenes2 2024.09 to Species (for long reads)</option>
34 </when> 166 <option value="greengenes_13.84">GreenGenes 13.84</option>
35 <when value="rdp"> 167 <option value="unite_8.0_fungi">UNITE Fungi: General Fasta 8.0 for Fungi</option>
36 <param name="version_select" type="select" label="Database version"> 168 <option value="unite_8.0_fungi_singletons">UNITE Fungi: General Fasta release 8.0 for Fungi including global and 97% singletons</option>
37 <option value="16">16</option> 169 <!-- UNITE Eukaryotes not yet supported https://github.com/benjjneb/dada2/issues/702 -->
38 <option value="14">14</option> 170 <option value="RefSeq_RDP_2018_05">NCBI RefSeq 16S rRNA database supplemented by RDP 05/2018</option>
39 </param> 171 <option value="gtdb_202_toGenus">GTDB: Genome Taxonomy Database 202 to Genus (for short reads) </option>
40 </when> 172 <option value="gtdb_202_toSpecies">GTDB: Genome Taxonomy Database 202 to Species (for long reads) </option>
41 <when value="greengenes"> 173 <option value="gtdb_2018_11">GTDB: Genome Taxonomy Database 11/2018</option>
42 <param name="version_select" type="select" label="Database version"> 174 <option value="hitdb_1">HitDB (Human InTestinal 16S) 1</option>
43 <option value="13.84">13.84</option> 175 <option value="silva_euk_18S_132">Silva Eukaryotic 18S 132</option>
44 </param> 176 <option value="PR2_4.11.1">Protist Ribosomal Reference database (PR2) 4.11.1</option>
45 </when> 177 </param>
46 <when value="unite"> 178 <param name="species_databases" type="select" multiple="true" optional="true" label="Species databases" help="for addSpecies">
47 <param name="version_select" type="select" label="Database version"> 179 <option value="silva_138.2">Silva 138.2</option>
48 <option value="8.0_fungi">release 8.0 for Fungi</option> 180 <option value="silva_138.2_fungi_18S">Silva 138.2 for Fungi 18S</option>
49 <option value="8.0_fungi_singletons">release 8.0 for Fungi including global and 97% singletons</option> 181 <option value="silva_138.2_fungi_26S">Silva 138.2 for Fungi 26S</option>
50 </param> 182 <option value="silva_138">Silva 138</option>
51 </when> 183 <option value="silva_132">Silva 132</option>
52 <when value="RefSeq_RDP"> 184 <option value="silva_128">Silva 128</option>
53 <param name="version_select" type="select" label="Database version"> 185 <option value="rdp_16">RDP 16</option>
54 <option value="2018_05">05/2018</option> 186 <option value="rdp_14">RDP 14</option>
55 </param> 187 <option value="gtdb_202">GTDB: Genome Taxonomy Database 202</option>
56 </when> 188 <option value="gtdb_2018_11">GTDB: Genome Taxonomy Database 11/2018</option>
57 <when value="gtdb"> 189 </param>
58 <param name="version_select" type="select" label="Database version">
59 <option value="2018_11">11/2018</option>
60 </param>
61 </when>
62 <when value="hitdb">
63 <param name="version_select" type="select" label="Database version">
64 <option value="1">1</option>
65 </param>
66 </when>
67 <when value="silva_euk_18S">
68 <param name="version_select" type="select" label="Database version">
69 <option value="132">132</option>
70 </param>
71 </when>
72 <when value="PR2">
73 <param name="version_select" type="select" label="Database version">
74 <option value="4.11.1">4.11.1</option>
75 </param>
76 </when>
77 </conditional>
78 </inputs> 190 </inputs>
79 <outputs> 191 <outputs>
80 <data name="out_file" format="data_manager_json" /> 192 <data name="out_file" format="data_manager_json" />
81 </outputs> 193 </outputs>
82 <tests> 194 <tests>
83 <test> 195 <test>
84 <param name="db_cond|db_select" value="silva"/> 196 <param name="taxonomy_databases" value="silva_138.2_toGenus,silva_138.2_toSpecies"/>
85 <param name="db_cond|version_select" value="138"/> 197 <param name="species_databases" value="silva_138.2"/>
198 <output name="out_file">
199 <assert_contents>
200 <has_text text="&quot;Silva version 138.2 to Genus (for short reads)&quot;"/>
201 <has_text text="&quot;Silva version 138.2 to Species (for long reads)&quot;"/>
202 <has_text text="&quot;Silva version 138.2&quot;"/>
203 </assert_contents>
204 </output>
205 <assert_command>
206 <has_text text="wget" n="3"/>
207 </assert_command>
208 </test>
209
210 <test>
211 <param name="taxonomy_databases" value="silva_138.2_fungi_18S_toGenus,silva_138.2_fungi_18S_toSpecies"/>
212 <param name="species_databases" value="silva_138.2_fungi_18S"/>
213 <output name="out_file">
214 <assert_contents>
215 <has_text text="&quot;Silva version 138.2 for Fungi 18S to Genus (for short reads)&quot;"/>
216 <has_text text="&quot;Silva version 138.2 for Fungi 18S to Species (for long reads)&quot;"/>
217 <has_text text="&quot;Silva version 138.2 for Fungi 18S&quot;"/>
218 </assert_contents>
219 </output>
220 <assert_command>
221 <has_text text="wget" n="3"/>
222 </assert_command>
223 </test>
224 <test>
225 <param name="taxonomy_databases" value="silva_138.2_fungi_26S_toGenus,silva_138.2_fungi_26S_toSpecies"/>
226 <param name="species_databases" value="silva_138.2_fungi_26S"/>
227 <output name="out_file">
228 <assert_contents>
229 <has_text text="&quot;Silva version 138.2 for Fungi 26S to Genus (for short reads)&quot;"/>
230 <has_text text="&quot;Silva version 138.2 for Fungi 26S to Species (for long reads)&quot;"/>
231 <has_text text="&quot;Silva version 138.2 for Fungi 26S&quot;"/>
232 </assert_contents>
233 </output>
234 <assert_command>
235 <has_text text="wget" n="3"/>
236 </assert_command>
237 </test>
238
239 <test>
240 <param name="taxonomy_databases" value="silva_138"/>
241 <param name="species_databases" value="silva_138"/>
86 <output name="out_file" file="silva138_json"/> 242 <output name="out_file" file="silva138_json"/>
87 </test> 243 <assert_command>
88 <test> 244 <has_text text="wget" n="2"/>
89 <param name="db_cond|db_select" value="silva"/> 245 </assert_command>
90 <param name="db_cond|version_select" value="132"/> 246 </test>
247 <test>
248 <param name="taxonomy_databases" value="silva_132"/>
249 <param name="species_databases" value="silva_132"/>
91 <output name="out_file" file="silva132_json"/> 250 <output name="out_file" file="silva132_json"/>
92 </test> 251 <assert_command>
93 <test> 252 <has_text text="wget" n="2"/>
94 <param name="db_cond|db_select" value="rdp"/> 253 </assert_command>
95 <param name="db_cond|version_select" value="16"/> 254 </test>
255 <test>
256 <param name="taxonomy_databases" value="rdp_19_toSpecies,rdp_19_toGenus"/>
257 <output name="out_file">
258 <assert_contents>
259 <has_text text="RDP trainset 19 to Species (for long reads)"/>
260 <has_text text="RDP trainset 19 to Genus (for short reads)"/>
261 </assert_contents>
262 </output>
263 <assert_command>
264 <has_text text="wget" n="2"/>
265 </assert_command>
266 </test>
267 <test>
268 <param name="taxonomy_databases" value="rdp_16"/>
269 <param name="species_databases" value="rdp_16"/>
96 <output name="out_file" file="rdp16_json"/> 270 <output name="out_file" file="rdp16_json"/>
97 </test> 271 <assert_command>
98 <test> 272 <has_text text="wget" n="2"/>
99 <param name="db_cond|db_select" value="greengenes"/> 273 </assert_command>
100 <param name="db_cond|version_select" value="13.84"/> 274 </test>
275 <test>
276 <param name="taxonomy_databases" value="greengenes2_2024.09_toSpecies,greengenes2_2024.09_toGenus"/>
277 <output name="out_file">
278 <assert_contents>
279 <has_text text="GreenGenes2 release 2024.09 to Genus (for short reads)"/>
280 <has_text text="GreenGenes2 release 2024.09 to Species (for long reads)"/>
281 </assert_contents>
282 </output>
283 <assert_command>
284 <has_text text="wget" n="2"/>
285 </assert_command>
286 </test>
287 <test>
288 <param name="taxonomy_databases" value="greengenes_13.84"/>
101 <output name="out_file" file="greengenes13.84_json"/> 289 <output name="out_file" file="greengenes13.84_json"/>
102 </test> 290 <assert_command>
103 <test> 291 <has_text text="wget" n="1"/>
104 <param name="db_cond|db_select" value="unite"/> 292 </assert_command>
105 <param name="db_cond|version_select" value="8.0_fungi"/> 293 </test>
294 <test>
295 <param name="taxonomy_databases" value="unite_8.0_fungi"/>
106 <output name="out_file" file="unite8fungi_json"/> 296 <output name="out_file" file="unite8fungi_json"/>
107 </test> 297 <assert_command>
108 <test> 298 <has_text text="unzip"/>
109 <param name="db_cond|db_select" value="unite"/> 299 </assert_command>
110 <param name="db_cond|version_select" value="8.0_fungi_singletons"/> 300 </test>
301 <test>
302 <param name="taxonomy_databases" value="unite_8.0_fungi_singletons"/>
111 <output name="out_file" file="unite8fungisingletons_json"/> 303 <output name="out_file" file="unite8fungisingletons_json"/>
112 </test> 304 <assert_command>
113 <test> 305 <has_text text="wget" n="1"/>
114 <param name="db_cond|db_select" value="RefSeq_RDP"/> 306 </assert_command>
115 <param name="db_cond|version_select" value="2018_05"/> 307 </test>
308 <test>
309 <param name="taxonomy_databases" value="RefSeq_RDP_2018_05"/>
116 <output name="out_file" file="RefSeq_RDP2018_json"/> 310 <output name="out_file" file="RefSeq_RDP2018_json"/>
117 </test> 311 <assert_command>
118 <test> 312 <has_text text="wget" n="1"/>
119 <param name="db_cond|db_select" value="gtdb"/> 313 </assert_command>
120 <param name="db_cond|version_select" value="2018_11"/> 314 </test>
315
316 <test>
317 <param name="taxonomy_databases" value="gtdb_202_toGenus,gtdb_202_toSpecies"/>
318 <param name="species_databases" value="gtdb_202"/>
319 <output name="out_file">
320 <assert_contents>
321 <has_text text="&quot;GTDB Version 202 to Genus (for short reads)&quot;"/>
322 <has_text text="&quot;GTDB Version 202 to Species (for long reads)&quot;"/>
323 <has_text text="&quot;GTDB Version 202&quot;"/>
324 </assert_contents>
325 </output>
326 <assert_command>
327 <has_text text="wget" n="3"/>
328 </assert_command>
329 </test>
330
331 <test>
332 <param name="taxonomy_databases" value="gtdb_2018_11"/>
333 <param name="species_databases" value="gtdb_2018_11"/>
121 <output name="out_file" file="gtdb2018_json"/> 334 <output name="out_file" file="gtdb2018_json"/>
122 </test> 335 <assert_command>
123 <test> 336 <has_text text="wget" n="2"/>
124 <param name="db_cond|db_select" value="hitdb"/> 337 </assert_command>
125 <param name="db_cond|version_select" value="1"/> 338 </test>
339 <test>
340 <param name="taxonomy_databases" value="hitdb_1"/>
126 <output name="out_file" file="hitdb1_json"/> 341 <output name="out_file" file="hitdb1_json"/>
127 </test> 342 <assert_command>
128 <test> 343 <has_text text="wget" n="1"/>
129 <param name="db_cond|db_select" value="silva_euk_18S"/> 344 </assert_command>
130 <param name="db_cond|version_select" value="132"/> 345 </test>
346 <test>
347 <param name="taxonomy_databases" value="silva_euk_18S_132"/>
131 <output name="out_file" file="silvaeuk132_json"/> 348 <output name="out_file" file="silvaeuk132_json"/>
132 </test> 349 <assert_command>
133 <test> 350 <has_text text="wget" n="1"/>
134 <param name="db_cond|db_select" value="PR2"/> 351 </assert_command>
135 <param name="db_cond|version_select" value="4.11.1"/> 352 </test>
353 <test>
354 <param name="taxonomy_databases" value="PR2_4.11.1"/>
136 <output name="out_file" file="PR24.11.1_json"/> 355 <output name="out_file" file="PR24.11.1_json"/>
356 <assert_command>
357 <has_text text="wget" n="1"/>
358 </assert_command>
137 </test> 359 </test>
138 </tests> 360 </tests>
139 <help><![CDATA[ 361 <help><![CDATA[
140 Public Reference databases maintained by the DADA2 project 362 Public Reference databases maintained by the DADA2 project
141 .......................................................... 363 ..........................................................
142 364
143 The following refrence databases which are describes as maintained by the DADA2 project (https://benjjneb.github.io/dada2/training.html) are available 365 The following refrence databases which are describes as maintained by the DADA2 project (https://benjjneb.github.io/dada2/training.html) are available
144 366
145 - Silva (https://www.arb-silva.de/) 367 - Silva
146 - RDP 368 - RDP
147 - GreenGenes (http://greengenes.secondgenome.com/) 369 - GreenGenes (https://web.archive.org/web/20240703054246/https://greengenes.secondgenome.com/)
370 - Greengenes2 (https://greengenes2.ucsd.edu/)
148 - UNITE general FASTA (https://unite.ut.ee/repository.php) 371 - UNITE general FASTA (https://unite.ut.ee/repository.php)
149 372
150 While Silva and RDP contain reference databases for taxonomy and species assignment, the greengenes and UNITE databases only contains a reference database for taxonomy assignment. 373 While Silva and RDP contain reference databases for taxonomy and species assignment, the greengenes and UNITE databases only contains a reference database for taxonomy assignment.
151 374
152 For the Silva databases check the license information: http://www.arb-silva.de/silva-license-information. 375 Silva are licensed under Create Commons Attribution 4.0 (CC-BY 4.0) since release 138.
153 376
154 Except for UNITE all reference databases are downloaded from the corresponding zenodo links that are listed on the DADA2 website. The UNITE databases are taken from the links provided on the UNITE website 377 Except for UNITE all reference databases are downloaded from the corresponding zenodo links that are listed on the DADA2 website. The UNITE databases are taken from the links provided on the UNITE website
155 378
156 More detailed informations in the reference data bases can be found on the DADA2 website and contained links: https://benjjneb.github.io/dada2/training.html. 379 More detailed informations in the reference data bases can be found on the DADA2 website and contained links: https://benjjneb.github.io/dada2/training.html.
157 380
174 <citations> 397 <citations>
175 <!-- silva --> 398 <!-- silva -->
176 <citation type="doi">10.1093/nar/gks1219</citation> 399 <citation type="doi">10.1093/nar/gks1219</citation>
177 <!-- rdp --> 400 <!-- rdp -->
178 <citation type="doi">10.1093/nar/gkt1244</citation> 401 <citation type="doi">10.1093/nar/gkt1244</citation>
402 <!-- greengenes2 -->
403 <citation type="doi">10.1038/s41587-023-01845-1</citation>
179 <!-- greengenes --> 404 <!-- greengenes -->
180 <citation type="doi">10.1128/AEM.03006-05</citation> 405 <citation type="doi">10.1128/AEM.03006-05</citation>
181 <!-- unite --> 406 <!-- unite -->
182 <citation type="doi">10.15156/BIO/786343</citation> 407 <citation type="doi">10.15156/BIO/786343</citation>
183 <!-- TODO gtdb ??? --> 408 <!-- TODO gtdb ??? -->