comparison datasets_genome.xml @ 21:0f3b3813b6ae draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/ncbi_datasets commit c1c3f90e4aa7dc258aa61d98ec4eac0b97eef426
author iuc
date Mon, 21 Jul 2025 19:28:16 +0000
parents da8260eba74b
children
comparison
equal deleted inserted replaced
20:7b925f7c50b2 21:0f3b3813b6ae
2 <description>download genome sequence, annotation and metadata</description> 2 <description>download genome sequence, annotation and metadata</description>
3 <macros> 3 <macros>
4 <import>macros.xml</import> 4 <import>macros.xml</import>
5 </macros> 5 </macros>
6 <expand macro="bio_tools"/> 6 <expand macro="bio_tools"/>
7 <expand macro="requirements"></expand> 7 <expand macro="requirements"/>
8 <expand macro="version_command"/> 8 <expand macro="version_command"/>
9 <command><![CDATA[ 9 <stdio>
10 <regex match="Warning" source="stderr" level="warning" description=""/>
11 <regex match="skipping" source="stderr" level="warning" description=""/>
12 <regex match="ERROR" level="fatal"/>
13 </stdio>
14 <command detect_errors="exit_code"><![CDATA[
10 #import re 15 #import re
11 @SETUP_CERTIFICATES@ 16 @SETUP_CERTIFICATES@
12 datasets download genome $query.subcommand.download_by 17 datasets download genome $query.subcommand.download_by
13 #if $query.subcommand.download_by == 'accession': 18 #if $query.subcommand.download_by == 'accession':
14 #if $query.subcommand.text_or_file.text_or_file == 'text': 19 #if $query.subcommand.text_or_file.text_or_file == 'text':
114 <option value="only" selected="false">Limit to MAGs</option> 119 <option value="only" selected="false">Limit to MAGs</option>
115 <option value="exclude" selected="false">Exclude MAGs</option> 120 <option value="exclude" selected="false">Exclude MAGs</option>
116 </param> 121 </param>
117 <expand macro="released_options"/> 122 <expand macro="released_options"/>
118 <expand macro="released_options" before_or_after="after"/> 123 <expand macro="released_options" before_or_after="after"/>
119
120 <repeat name="search" title="Add search terms"> 124 <repeat name="search" title="Add search terms">
121 <param argument="--search" type="text" label="Only include genomes that have the specified text in the searchable fields" help="Searchable fields are species and infraspecies, assembly name and submitter"/> 125 <param argument="--search" type="text" label="Only include genomes that have the specified text in the searchable fields" help="Searchable fields are species and infraspecies, assembly name and submitter"/>
122 </repeat> 126 </repeat>
123 </section> 127 </section>
124 <section name="file_choices" title="Output options" expanded="true"> 128 <section name="file_choices" title="Output options" expanded="true">
135 </section> 139 </section>
136 </inputs> 140 </inputs>
137 <outputs> 141 <outputs>
138 <data name="genome_data_report" format="tabular" label="NCBI Genome Datasets: Data Report" from_work_dir="genome_data_report.tsv"/> 142 <data name="genome_data_report" format="tabular" label="NCBI Genome Datasets: Data Report" from_work_dir="genome_data_report.tsv"/>
139 <collection name="sequence_report" label="NCBI Genome Datasets: Sequence Data Report" type="list"> 143 <collection name="sequence_report" label="NCBI Genome Datasets: Sequence Data Report" type="list">
140 <discover_datasets pattern="(?P&lt;identifier_0&gt;.*?)\/sequence_report.tsv" ext="tabular" directory="ncbi_dataset/data" recurse="true" match_relative_path="true"/> 144 <discover_datasets pattern="(?P&lt;identifier_0&gt;.*?)\/sequence_report.tsv" ext="tabular" directory="ncbi_dataset/data/" recurse="true" match_relative_path="true"/>
141 <filter>file_choices['include'] and "seq-report" in file_choices['include']</filter> 145 <filter>file_choices['include'] and "seq-report" in file_choices['include']</filter>
142 </collection> 146 </collection>
143 <collection name="genome_fasta" label="NCBI Genome Datasets: genome fasta" type="list:list"> 147 <collection name="genome_fasta" label="NCBI Genome Datasets: genome fasta" type="list:list">
144 <discover_datasets pattern="(?P&lt;identifier_0&gt;.*?)/(?!rna|cds_from)(?P&lt;identifier_1&gt;.*?)(_genomic)?\.(?P&lt;ext&gt;fasta(\.gz)?)" directory="ncbi_dataset/data" recurse="true" match_relative_path="true"/> 148 <discover_datasets pattern="(?P&lt;identifier_0&gt;.*?)/(?!rna|cds_from)(?P&lt;identifier_1&gt;.*?)(_genomic)?\.(?P&lt;ext&gt;fasta(\.gz)?)" directory="ncbi_dataset/data/" recurse="true" match_relative_path="true"/>
145 <filter>file_choices['include'] and "genome" in file_choices['include']</filter> 149 <filter>file_choices['include'] and "genome" in file_choices['include']</filter>
146 </collection> 150 </collection>
147 <collection name="rna_fasta" label="NCBI Genome Datasets: RNA fasta" type="list"> 151 <collection name="rna_fasta" label="NCBI Genome Datasets: RNA fasta" type="list">
148 <discover_datasets pattern="(?P&lt;identifier_0&gt;.*?)\/rna\.(?P&lt;ext&gt;fasta(\.gz)?)$" directory="ncbi_dataset/data" recurse="true" match_relative_path="true"/> 152 <discover_datasets pattern="(?P&lt;identifier_0&gt;.*?)\/rna\.(?P&lt;ext&gt;fasta(\.gz)?)$" directory="ncbi_dataset/data/" recurse="true" match_relative_path="true"/>
149 <filter>file_choices['include'] and "rna" in file_choices['include']</filter> 153 <filter>file_choices['include'] and "rna" in file_choices['include']</filter>
150 </collection> 154 </collection>
151 <collection name="protein_fasta" label="NCBI Genome Datasets: protein fasta" type="list"> 155 <collection name="protein_fasta" label="NCBI Genome Datasets: protein fasta" type="list">
152 <discover_datasets pattern="(?P&lt;identifier_0&gt;.*?)\/protein\.(?P&lt;ext&gt;fasta(\.gz)?)$" directory="ncbi_dataset/data" recurse="true" match_relative_path="true"/> 156 <discover_datasets pattern="(?P&lt;identifier_0&gt;.*?)\/protein\.(?P&lt;ext&gt;fasta(\.gz)?)$" directory="ncbi_dataset/data/" recurse="true" match_relative_path="true"/>
153 <filter>file_choices['include'] and "protein" in file_choices['include']</filter> 157 <filter>file_choices['include'] and "protein" in file_choices['include']</filter>
154 </collection> 158 </collection>
155 <collection name="genomic_cds" label="NCBI Genome Datasets: genomic cds fasta" type="list"> 159 <collection name="genomic_cds" label="NCBI Genome Datasets: genomic cds fasta" type="list">
156 <discover_datasets pattern="(?P&lt;identifier_0&gt;.*?)\/cds_from_genomic\.(?P&lt;ext&gt;fasta(\.gz)?)$" directory="ncbi_dataset/data" recurse="true" match_relative_path="true"/> 160 <discover_datasets pattern="(?P&lt;identifier_0&gt;.*?)\/cds_from_genomic\.(?P&lt;ext&gt;fasta(\.gz)?)$" directory="ncbi_dataset/data/" recurse="true" match_relative_path="true"/>
157 <filter>file_choices['include'] and "cds" in file_choices['include']</filter> 161 <filter>file_choices['include'] and "cds" in file_choices['include']</filter>
158 </collection> 162 </collection>
159 <collection name="genomic_gff" label="NCBI Genome Datasets: genomic gff3" type="list"> 163 <collection name="genomic_gff" label="NCBI Genome Datasets: genomic gff3" type="list">
160 <discover_datasets pattern="(?P&lt;identifier_0&gt;.*?)\/genomic\.gff" ext="gff3" directory="ncbi_dataset/data" recurse="true" match_relative_path="true"/> 164 <discover_datasets pattern="(?P&lt;identifier_0&gt;.*?)\/genomic\.gff" ext="gff3" directory="ncbi_dataset/data/" recurse="true" match_relative_path="true"/>
161 <filter>file_choices['include'] and "gff3" in file_choices['include']</filter> 165 <filter>file_choices['include'] and "gff3" in file_choices['include']</filter>
162 </collection> 166 </collection>
163 <collection name="genomic_gtf" label="NCBI Genome Datasets: gtf" type="list"> 167 <collection name="genomic_gtf" label="NCBI Genome Datasets: gtf" type="list">
164 <discover_datasets pattern="(?P&lt;identifier_0&gt;.*?)\/genomic\.gtf" ext="gtf" directory="ncbi_dataset/data" recurse="true" match_relative_path="true"/> 168 <discover_datasets pattern="(?P&lt;identifier_0&gt;.*?)\/genomic\.gtf" ext="gtf" directory="ncbi_dataset/data/" recurse="true" match_relative_path="true"/>
165 <filter>file_choices['include'] and "gtf" in file_choices['include']</filter> 169 <filter>file_choices['include'] and "gtf" in file_choices['include']</filter>
166 </collection> 170 </collection>
167 <collection name="genomic_gbff" label="NCBI Genome Datasets: GenBank flatfile" type="list"> 171 <collection name="genomic_gbff" label="NCBI Genome Datasets: GenBank flatfile" type="list">
168 <discover_datasets pattern="(?P&lt;identifier_0&gt;.*?)\/genomic\.gbff" ext="txt" directory="ncbi_dataset/data" recurse="true" match_relative_path="true"/> 172 <discover_datasets pattern="(?P&lt;identifier_0&gt;.*?)\/genomic\.gbff" ext="txt" directory="ncbi_dataset/data/" recurse="true" match_relative_path="true"/>
169 <filter>file_choices['include'] and "gbff" in file_choices['include']</filter> 173 <filter>file_choices['include'] and "gbff" in file_choices['include']</filter>
170 </collection> 174 </collection>
171 </outputs> 175 </outputs>
172 <tests> 176 <tests>
173 <test expect_num_outputs="3"> 177 <test expect_num_outputs="3">
174 <conditional name="query|subcommand"> 178 <conditional name="query|subcommand">
175 <param name="download_by" value="taxon"/> 179 <param name="download_by" value="taxon"/>
176 <param name="taxon_positional" value="human"/> 180 <param name="taxon_positional" value="human"/>
177 </conditional> 181 </conditional>
178 <param name="chromosomes" value="21"/> 182 <section name="filters">
179 <param name="released_before" value="01/01/2018"/> 183 <param name="chromosomes" value="21"/>
184 <param name="released_before" value="01/01/2018"/>
185 </section>
180 <section name="file_choices"> 186 <section name="file_choices">
181 <!-- include a sequence (which should be downloaded as fasta.gz) 187 <!-- include a sequence (which should be downloaded as fasta.gz)
182 and one non-sequence (which should be decompressed) output --> 188 and one non-sequence (which should be decompressed) output -->
183 <param name="include" value="rna,gff3"/> 189 <param name="include" value="rna,gff3"/>
184 </section> 190 </section>
185 <output name="genome_data_report"> 191 <output name="genome_data_report">
186 <assert_contents> 192 <assert_contents>
187 <has_text text="Assembly Accession&#009;Assembly Name&#009;Assembly Submitter&#009;Organism Name"/> 193 <has_text text="Assembly Accession&#9;Assembly Name&#9;Assembly Submitter&#9;Organism Name"/>
188 <has_n_lines n="142"/> 194 <has_n_lines n="142"/>
189 <has_n_columns n="4"/> 195 <has_n_columns n="4"/>
190 </assert_contents> 196 </assert_contents>
191 </output> 197 </output>
192 <output_collection name="rna_fasta" type="list" count="1"> 198 <output_collection name="rna_fasta" type="list" count="2">
193 <element name="GCF_000306695.2" decompress="true"> 199 <element name="GCF_000306695.2" decompress="true">
194 <assert_contents> 200 <assert_contents>
195 <has_text text=">"/> 201 <has_text text="&gt;"/>
196 </assert_contents> 202 </assert_contents>
197 </element> 203 </element>
198 </output_collection> 204 </output_collection>
199 <output_collection name="genomic_gff" type="list"> 205 <output_collection name="genomic_gff" type="list" count="12">
200 <element name="GCF_000306695.2"> 206 <element name="GCF_000306695.2">
201 <assert_contents> 207 <assert_contents>
202 <has_n_lines min="1000000"/> 208 <has_n_lines min="1000000"/>
203 <has_line line="##gff-version 3"/> 209 <has_line line="##gff-version 3"/>
204 <has_n_columns n="9" comment="#"/> 210 <has_n_columns n="9" comment="#"/>
212 <test expect_num_outputs="2"> 218 <test expect_num_outputs="2">
213 <conditional name="query|subcommand"> 219 <conditional name="query|subcommand">
214 <param name="download_by" value="taxon"/> 220 <param name="download_by" value="taxon"/>
215 <param name="taxon_positional" value="human"/> 221 <param name="taxon_positional" value="human"/>
216 </conditional> 222 </conditional>
217 <param name="chromosomes" value="21"/> 223 <section name="filters">
218 <param name="assembly_level" value="chromosome,complete"/> 224 <param name="chromosomes" value="21"/>
219 <param name="released_before" value="01/01/2018"/> 225 <param name="assembly_level" value="chromosome,complete"/>
226 <param name="released_before" value="01/01/2018"/>
227 </section>
220 <section name="file_choices"> 228 <section name="file_choices">
221 <param name="include" value="genome"/> 229 <param name="include" value="genome"/>
222 <param name="decompress" value="true"/> 230 <param name="decompress" value="true"/>
223 </section> 231 </section>
224 <output_collection name="genome_fasta" type="list:list" count="12"> 232 <output_collection name="genome_fasta" type="list:list" count="11">
225 <expand macro="genome_fasta_assert" el1="GCA_000002115.2" el2="chr21" expression=">"/> 233 <expand macro="genome_fasta_assert" el1="GCA_000002115.2" el2="chr21" expression="&gt;"/>
226 <expand macro="genome_fasta_assert" el1="GCA_000002125.2" el2="chr21" expression=">"/> 234 <expand macro="genome_fasta_assert" el1="GCA_000002125.2" el2="chr21" expression="&gt;"/>
227 <expand macro="genome_fasta_assert" el1="GCA_000212995.1" el2="chr21" expression=">"/> 235 <expand macro="genome_fasta_assert" el1="GCA_000212995.1" el2="chr21" expression="&gt;"/>
228 <expand macro="genome_fasta_assert" el1="GCA_000252825.1" el2="chr21" expression=">"/> 236 <expand macro="genome_fasta_assert" el1="GCA_000306695.2" el2="chr21" expression="&gt;"/>
229 <expand macro="genome_fasta_assert" el1="GCA_000306695.2" el2="chr21" expression=">"/> 237 <expand macro="genome_fasta_assert" el1="GCA_000365445.1" el2="chr21" expression="&gt;"/>
230 <expand macro="genome_fasta_assert" el1="GCA_000365445.1" el2="chr21" expression=">"/> 238 <expand macro="genome_fasta_assert" el1="GCA_001292825.2" el2="chr21" expression="&gt;"/>
231 <expand macro="genome_fasta_assert" el1="GCA_001292825.2" el2="chr21" expression=">"/> 239 <expand macro="genome_fasta_assert" el1="GCA_001524155.4" el2="chr21" expression="&gt;"/>
232 <expand macro="genome_fasta_assert" el1="GCA_001524155.4" el2="chr21" expression=">"/> 240 <expand macro="genome_fasta_assert" el1="GCA_001712695.1" el2="chr21" expression="&gt;"/>
233 <expand macro="genome_fasta_assert" el1="GCA_001712695.1" el2="chr21" expression=">"/> 241 <expand macro="genome_fasta_assert" el1="GCA_022833125.2" el2="chr21" expression="&gt;"/>
234 <expand macro="genome_fasta_assert" el1="GCA_022833125.2" el2="chr21" expression=">"/> 242 <expand macro="genome_fasta_assert" el1="GCF_000002125.1" el2="chr21" expression="&gt;"/>
235 <expand macro="genome_fasta_assert" el1="GCF_000002125.1" el2="chr21" expression=">"/> 243 <expand macro="genome_fasta_assert" el1="GCF_000306695.2" el2="chr21" expression="&gt;"/>
236 <expand macro="genome_fasta_assert" el1="GCF_000306695.2" el2="chr21" expression=">"/>
237 <!-- According to https://github.com/ncbi/datasets/issues/188, the following should not be included among the returned results anymore 09/2023 --> 244 <!-- According to https://github.com/ncbi/datasets/issues/188, the following should not be included among the returned results anymore 09/2023 -->
238 <!-- 245 <!--
239 <expand macro="genome_fasta_assert" el1="GCA_000442335.2" el2="GCA_000442335.2_LinearCen1.1_normalized" expression=">" expression_n="25"/> 246 <expand macro="genome_fasta_assert" el1="GCA_000442335.2" el2="GCA_000442335.2_LinearCen1.1_normalized" expression=">" expression_n="25"/>
240 <expand macro="genome_fasta_assert" el1="GCA_000002135.3" el2="GCA_000002135.3_CRA_TCAGchr7v2" expression=">"/> 247 <expand macro="genome_fasta_assert" el1="GCA_000002135.3" el2="GCA_000002135.3_CRA_TCAGchr7v2" expression=">"/>
241 --> 248 -->
251 <test expect_failure="true"> 258 <test expect_failure="true">
252 <conditional name="query|subcommand"> 259 <conditional name="query|subcommand">
253 <param name="download_by" value="taxon"/> 260 <param name="download_by" value="taxon"/>
254 <param name="taxon_positional" value="human"/> 261 <param name="taxon_positional" value="human"/>
255 </conditional> 262 </conditional>
256 <param name="chromosomes" value="21"/> 263 <section name="filters">
257 <param name="assembly_level" value="chromosome,complete"/> 264 <param name="chromosomes" value="21"/>
258 <param name="assembly_source" value="refseq"/> 265 <param name="assembly_level" value="chromosome,complete"/>
259 <param name="released_before" value="01/01/2018"/> 266 <param name="assembly_source" value="refseq"/>
267 <param name="released_before" value="01/01/2018"/>
268 </section>
260 <section name="file_choices"> 269 <section name="file_choices">
261 <param name="include" value="genome"/> 270 <param name="include" value="genome"/>
262 <param name="decompress" value="true"/> 271 <param name="decompress" value="true"/>
263 </section> 272 </section>
264 <assert_stderr> 273 <assert_stderr>
286 <conditional name="text_or_file"> 295 <conditional name="text_or_file">
287 <param name="text_or_file" value="text"/> 296 <param name="text_or_file" value="text"/>
288 <param name="accession" value="GCF_000013305.1 GCF_000007445.1"/> 297 <param name="accession" value="GCF_000013305.1 GCF_000007445.1"/>
289 </conditional> 298 </conditional>
290 </conditional> 299 </conditional>
291 <param name="released_before" value="01/01/2007"/> 300 <section name="filters">
301 <param name="released_before" value="01/01/2007"/>
302 </section>
292 <section name="file_choices"> 303 <section name="file_choices">
293 <param name="include" value="seq-report,gtf,cds"/> 304 <param name="include" value="seq-report,gtf,cds"/>
294 <param name="decompress" value="true"/> 305 <param name="decompress" value="true"/>
295 </section> 306 </section>
296 <output name="genome_data_report"> 307 <output name="genome_data_report">
298 <has_text text="GCF_000013305.1"/> 309 <has_text text="GCF_000013305.1"/>
299 <has_n_lines n="3"/> 310 <has_n_lines n="3"/>
300 <has_n_columns n="4"/> 311 <has_n_columns n="4"/>
301 </assert_contents> 312 </assert_contents>
302 </output> 313 </output>
303 <output_collection name="sequence_report" type="list" count="2" > 314 <output_collection name="sequence_report" type="list" count="2">
304 <element name="GCF_000007445.1"> 315 <element name="GCF_000007445.1">
305 <assert_contents> 316 <assert_contents>
306 <has_text text="GCF_000007445.1"/> 317 <has_text text="GCF_000007445.1"/>
307 <has_n_lines n="2"/> 318 <has_n_lines n="2"/>
308 <has_n_columns n="15"/> 319 <has_n_columns n="15"/>
314 <has_n_lines n="2"/> 325 <has_n_lines n="2"/>
315 <has_n_columns n="15"/> 326 <has_n_columns n="15"/>
316 </assert_contents> 327 </assert_contents>
317 </element> 328 </element>
318 </output_collection> 329 </output_collection>
319 <output_collection name="genomic_gtf" type="list"> 330 <output_collection name="genomic_gtf" type="list" count="2">
320 <element name="GCF_000007445.1" file="GCF_000007445.1.genomic.gtf" compare="contains"/> 331 <element name="GCF_000007445.1" file="GCF_000007445.1.genomic.gtf" compare="contains"/>
321 <element name="GCF_000013305.1" file="genome.2.GCF_000013305.1.genomic.gtf" compare="contains"/> 332 <element name="GCF_000013305.1" file="genome.2.GCF_000013305.1.genomic.gtf" compare="contains"/>
322 </output_collection> 333 </output_collection>
323 <output_collection name="genomic_cds" type="list"> 334 <output_collection name="genomic_cds" type="list">
324 <element name="GCF_000007445.1" file="genome.2.GCF_000007445.1.genomic.cds" compare="contains"/> 335 <element name="GCF_000007445.1" file="genome.2.GCF_000007445.1.genomic.cds" compare="contains"/>
331 <conditional name="text_or_file"> 342 <conditional name="text_or_file">
332 <param name="text_or_file" value="file"/> 343 <param name="text_or_file" value="file"/>
333 <param name="inputfile" value="accessions.txt"/> 344 <param name="inputfile" value="accessions.txt"/>
334 </conditional> 345 </conditional>
335 </conditional> 346 </conditional>
336 <param name="released_before" value="01/01/2007"/> 347 <section name="filters">
348 <param name="released_before" value="01/01/2007"/>
349 </section>
337 <section name="file_choices"> 350 <section name="file_choices">
338 <param name="include" value="seq-report,gff3,gbff"/> 351 <param name="include" value="seq-report,gff3,gbff"/>
339 <param name="decompress" value="true"/> 352 <param name="decompress" value="true"/>
340 </section> 353 </section>
341 <output name="genome_data_report"> 354 <output name="genome_data_report">
353 <output_collection name="genomic_gbff" type="list"> 366 <output_collection name="genomic_gbff" type="list">
354 <element name="GCF_000007445.1" file="genome.3.GCF_000007445.1.genomic.gbff" compare="contains"/> 367 <element name="GCF_000007445.1" file="genome.3.GCF_000007445.1.genomic.gbff" compare="contains"/>
355 <element name="GCF_000013305.1" file="genome.3.GCF_000013305.1.genomic.gbff" compare="contains"/> 368 <element name="GCF_000013305.1" file="genome.3.GCF_000013305.1.genomic.gbff" compare="contains"/>
356 </output_collection> 369 </output_collection>
357 </test> 370 </test>
358
359 <!-- should not fail https://github.com/ncbi/datasets/issues/194 --> 371 <!-- should not fail https://github.com/ncbi/datasets/issues/194 -->
360 <test expect_num_outputs="2"> 372 <test expect_num_outputs="2">
361 <conditional name="query|subcommand"> 373 <conditional name="query|subcommand">
362 <param name="download_by" value="accession"/> 374 <param name="download_by" value="accession"/>
363 <conditional name="text_or_file"> 375 <conditional name="text_or_file">
364 <param name="text_or_file" value="text"/> 376 <param name="text_or_file" value="text"/>
365 <param name="accession" value="GCF_000001405"/> 377 <param name="accession" value="GCF_000001405"/>
366 </conditional> 378 </conditional>
367 </conditional> 379 </conditional>
368 <param name="released_before" value="01/01/2015"/> 380 <section name="filters">
369 <param name="assembly_version" value="all"/> 381 <param name="released_before" value="01/01/2015"/>
382 <param name="assembly_version" value="all"/>
383 </section>
370 <section name="file_choices"> 384 <section name="file_choices">
371 <param name="include" value="seq-report"/> 385 <param name="include" value="seq-report"/>
372 </section> 386 </section>
373 <output name="genome_data_report"> 387 <output name="genome_data_report">
374 <!-- assert that we get at least the 16 versions available at the time of writing this test --> 388 <!-- assert that we get at least the 16 versions available at the time of writing this test -->
393 <section name="file_choices"> 407 <section name="file_choices">
394 <param name="include" value="genome,protein,rna,cds"/> 408 <param name="include" value="genome,protein,rna,cds"/>
395 <param name="decompress" value="true"/> 409 <param name="decompress" value="true"/>
396 </section> 410 </section>
397 <output_collection name="genome_fasta" type="list:list" count="1"> 411 <output_collection name="genome_fasta" type="list:list" count="1">
398 <expand macro="genome_fasta_assert" el1="GCF_000146045.2" el2="GCF_000146045.2_R64" expression=">NC_[0-9]+\.[0-9]+ Saccharomyces cerevisiae S288[Cc] (mitochondrion|chromosome .*), complete (sequence|genome)" expression_n="17"/> 412 <expand macro="genome_fasta_assert" el1="GCF_000146045.2" el2="GCF_000146045.2_R64" expression="&gt;NC_[0-9]+\.[0-9]+ Saccharomyces cerevisiae S288[Cc] (mitochondrion|chromosome .*), complete (sequence|genome)" expression_n="17"/>
399 </output_collection> 413 </output_collection>
400 <output_collection name="protein_fasta" type="list" count="1"> 414 <output_collection name="protein_fasta" type="list" count="1">
401 <element name="GCF_000146045.2" decompress="true"> 415 <element name="GCF_000146045.2" decompress="true">
402 <assert_contents> 416 <assert_contents>
403 <has_text text=">"/> 417 <has_text text="&gt;"/>
404 </assert_contents> 418 </assert_contents>
405 </element> 419 </element>
406 </output_collection> 420 </output_collection>
407 <output_collection name="rna_fasta" type="list" count="1"> 421 <output_collection name="rna_fasta" type="list" count="1">
408 <element name="GCF_000146045.2" decompress="true"> 422 <element name="GCF_000146045.2" decompress="true">
409 <assert_contents> 423 <assert_contents>
410 <has_text text=">"/> 424 <has_text text="&gt;"/>
411 </assert_contents> 425 </assert_contents>
412 </element> 426 </element>
413 </output_collection> 427 </output_collection>
414 </test> 428 </test>
415 <!-- same as the previous test, but use the default value for decompress, 429 <!-- same as the previous test, but use the default value for decompress,
435 </element> 449 </element>
436 </output_collection> 450 </output_collection>
437 <output_collection name="protein_fasta" type="list" count="1"> 451 <output_collection name="protein_fasta" type="list" count="1">
438 <element name="GCF_000146045.2" ftype="fasta.gz"> 452 <element name="GCF_000146045.2" ftype="fasta.gz">
439 <assert_contents> 453 <assert_contents>
440 <has_size value="1845038" delta="2000"/> 454 <has_size value="1847862" delta="2000"/>
441 </assert_contents> 455 </assert_contents>
442 </element> 456 </element>
443 </output_collection> 457 </output_collection>
444 <output_collection name="rna_fasta" type="list" count="1"> 458 <output_collection name="rna_fasta" type="list" count="1">
445 <element name="GCF_000146045.2" ftype="fasta.gz"> 459 <element name="GCF_000146045.2" ftype="fasta.gz">
461 <param name="include" value="seq-report,genome"/> 475 <param name="include" value="seq-report,genome"/>
462 <param name="decompress" value="true"/> 476 <param name="decompress" value="true"/>
463 </section> 477 </section>
464 <output_collection name="sequence_report" type="list" count="2"/> 478 <output_collection name="sequence_report" type="list" count="2"/>
465 <output_collection name="genome_fasta" type="list:list" count="2"> 479 <output_collection name="genome_fasta" type="list:list" count="2">
466 <expand macro="genome_fasta_assert" el1="GCF_000002945.2" el2="GCF_000002945.2_ASM294v3" expression=">NC_[0-9]+\.[0-9]+ Schizosaccharomyces pombe.*" expression_n="4"/> 480 <expand macro="genome_fasta_assert" el1="GCF_000002945.2" el2="GCF_000002945.2_ASM294v3" expression="&gt;NC_[0-9]+\.[0-9]+ Schizosaccharomyces pombe.*" expression_n="4"/>
467 <expand macro="genome_fasta_assert" el1="GCF_000146045.2" el2="GCF_000146045.2_R64" expression=">NC_[0-9]+\.[0-9]+ Saccharomyces cerevisiae S288[Cc].*" expression_n="17"/> 481 <expand macro="genome_fasta_assert" el1="GCF_000146045.2" el2="GCF_000146045.2_R64" expression="&gt;NC_[0-9]+\.[0-9]+ Saccharomyces cerevisiae S288[Cc].*" expression_n="17"/>
468 </output_collection> 482 </output_collection>
469 </test> 483 </test>
470 <!-- tax_exact_match should filter out strains 484 <!-- tax_exact_match should filter out strains
471 https://github.com/ncbi/datasets/issues/187 --> 485 https://github.com/ncbi/datasets/issues/187 -->
472 <test expect_num_outputs="1"> 486 <test expect_num_outputs="2">
473 <conditional name="query|subcommand"> 487 <conditional name="query|subcommand">
474 <param name="download_by" value="taxon"/> 488 <param name="download_by" value="taxon"/>
475 <param name="taxon_positional" value="4932"/> 489 <param name="taxon_positional" value="4932"/>
476 <param name="tax_exact_match" value="true"/> 490 <param name="tax_exact_match" value="true"/>
477 </conditional> 491 </conditional>
478 <param name="include" value=""/> 492 <output name="genome_data_report">
479 <output name="genome_data_report"> 493 <assert_contents>
480 <assert_contents> 494 <has_text text="Saccharomyces cerevisiae ZTW1" negate="true"/>
481 <has_text text="Saccharomyces cerevisiae ZTW1" negate="true"/>
482 </assert_contents> 495 </assert_contents>
483 </output> 496 </output>
484 </test> 497 </test>
485 </tests> 498 </tests>
486 <help> 499 <help>