Mercurial > repos > iuc > ncbi_datasets
comparison datasets_genome.xml @ 21:0f3b3813b6ae draft
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/ncbi_datasets commit c1c3f90e4aa7dc258aa61d98ec4eac0b97eef426
| author | iuc |
|---|---|
| date | Mon, 21 Jul 2025 19:28:16 +0000 |
| parents | da8260eba74b |
| children |
comparison
equal
deleted
inserted
replaced
| 20:7b925f7c50b2 | 21:0f3b3813b6ae |
|---|---|
| 2 <description>download genome sequence, annotation and metadata</description> | 2 <description>download genome sequence, annotation and metadata</description> |
| 3 <macros> | 3 <macros> |
| 4 <import>macros.xml</import> | 4 <import>macros.xml</import> |
| 5 </macros> | 5 </macros> |
| 6 <expand macro="bio_tools"/> | 6 <expand macro="bio_tools"/> |
| 7 <expand macro="requirements"></expand> | 7 <expand macro="requirements"/> |
| 8 <expand macro="version_command"/> | 8 <expand macro="version_command"/> |
| 9 <command><![CDATA[ | 9 <stdio> |
| 10 <regex match="Warning" source="stderr" level="warning" description=""/> | |
| 11 <regex match="skipping" source="stderr" level="warning" description=""/> | |
| 12 <regex match="ERROR" level="fatal"/> | |
| 13 </stdio> | |
| 14 <command detect_errors="exit_code"><![CDATA[ | |
| 10 #import re | 15 #import re |
| 11 @SETUP_CERTIFICATES@ | 16 @SETUP_CERTIFICATES@ |
| 12 datasets download genome $query.subcommand.download_by | 17 datasets download genome $query.subcommand.download_by |
| 13 #if $query.subcommand.download_by == 'accession': | 18 #if $query.subcommand.download_by == 'accession': |
| 14 #if $query.subcommand.text_or_file.text_or_file == 'text': | 19 #if $query.subcommand.text_or_file.text_or_file == 'text': |
| 114 <option value="only" selected="false">Limit to MAGs</option> | 119 <option value="only" selected="false">Limit to MAGs</option> |
| 115 <option value="exclude" selected="false">Exclude MAGs</option> | 120 <option value="exclude" selected="false">Exclude MAGs</option> |
| 116 </param> | 121 </param> |
| 117 <expand macro="released_options"/> | 122 <expand macro="released_options"/> |
| 118 <expand macro="released_options" before_or_after="after"/> | 123 <expand macro="released_options" before_or_after="after"/> |
| 119 | |
| 120 <repeat name="search" title="Add search terms"> | 124 <repeat name="search" title="Add search terms"> |
| 121 <param argument="--search" type="text" label="Only include genomes that have the specified text in the searchable fields" help="Searchable fields are species and infraspecies, assembly name and submitter"/> | 125 <param argument="--search" type="text" label="Only include genomes that have the specified text in the searchable fields" help="Searchable fields are species and infraspecies, assembly name and submitter"/> |
| 122 </repeat> | 126 </repeat> |
| 123 </section> | 127 </section> |
| 124 <section name="file_choices" title="Output options" expanded="true"> | 128 <section name="file_choices" title="Output options" expanded="true"> |
| 135 </section> | 139 </section> |
| 136 </inputs> | 140 </inputs> |
| 137 <outputs> | 141 <outputs> |
| 138 <data name="genome_data_report" format="tabular" label="NCBI Genome Datasets: Data Report" from_work_dir="genome_data_report.tsv"/> | 142 <data name="genome_data_report" format="tabular" label="NCBI Genome Datasets: Data Report" from_work_dir="genome_data_report.tsv"/> |
| 139 <collection name="sequence_report" label="NCBI Genome Datasets: Sequence Data Report" type="list"> | 143 <collection name="sequence_report" label="NCBI Genome Datasets: Sequence Data Report" type="list"> |
| 140 <discover_datasets pattern="(?P<identifier_0>.*?)\/sequence_report.tsv" ext="tabular" directory="ncbi_dataset/data" recurse="true" match_relative_path="true"/> | 144 <discover_datasets pattern="(?P<identifier_0>.*?)\/sequence_report.tsv" ext="tabular" directory="ncbi_dataset/data/" recurse="true" match_relative_path="true"/> |
| 141 <filter>file_choices['include'] and "seq-report" in file_choices['include']</filter> | 145 <filter>file_choices['include'] and "seq-report" in file_choices['include']</filter> |
| 142 </collection> | 146 </collection> |
| 143 <collection name="genome_fasta" label="NCBI Genome Datasets: genome fasta" type="list:list"> | 147 <collection name="genome_fasta" label="NCBI Genome Datasets: genome fasta" type="list:list"> |
| 144 <discover_datasets pattern="(?P<identifier_0>.*?)/(?!rna|cds_from)(?P<identifier_1>.*?)(_genomic)?\.(?P<ext>fasta(\.gz)?)" directory="ncbi_dataset/data" recurse="true" match_relative_path="true"/> | 148 <discover_datasets pattern="(?P<identifier_0>.*?)/(?!rna|cds_from)(?P<identifier_1>.*?)(_genomic)?\.(?P<ext>fasta(\.gz)?)" directory="ncbi_dataset/data/" recurse="true" match_relative_path="true"/> |
| 145 <filter>file_choices['include'] and "genome" in file_choices['include']</filter> | 149 <filter>file_choices['include'] and "genome" in file_choices['include']</filter> |
| 146 </collection> | 150 </collection> |
| 147 <collection name="rna_fasta" label="NCBI Genome Datasets: RNA fasta" type="list"> | 151 <collection name="rna_fasta" label="NCBI Genome Datasets: RNA fasta" type="list"> |
| 148 <discover_datasets pattern="(?P<identifier_0>.*?)\/rna\.(?P<ext>fasta(\.gz)?)$" directory="ncbi_dataset/data" recurse="true" match_relative_path="true"/> | 152 <discover_datasets pattern="(?P<identifier_0>.*?)\/rna\.(?P<ext>fasta(\.gz)?)$" directory="ncbi_dataset/data/" recurse="true" match_relative_path="true"/> |
| 149 <filter>file_choices['include'] and "rna" in file_choices['include']</filter> | 153 <filter>file_choices['include'] and "rna" in file_choices['include']</filter> |
| 150 </collection> | 154 </collection> |
| 151 <collection name="protein_fasta" label="NCBI Genome Datasets: protein fasta" type="list"> | 155 <collection name="protein_fasta" label="NCBI Genome Datasets: protein fasta" type="list"> |
| 152 <discover_datasets pattern="(?P<identifier_0>.*?)\/protein\.(?P<ext>fasta(\.gz)?)$" directory="ncbi_dataset/data" recurse="true" match_relative_path="true"/> | 156 <discover_datasets pattern="(?P<identifier_0>.*?)\/protein\.(?P<ext>fasta(\.gz)?)$" directory="ncbi_dataset/data/" recurse="true" match_relative_path="true"/> |
| 153 <filter>file_choices['include'] and "protein" in file_choices['include']</filter> | 157 <filter>file_choices['include'] and "protein" in file_choices['include']</filter> |
| 154 </collection> | 158 </collection> |
| 155 <collection name="genomic_cds" label="NCBI Genome Datasets: genomic cds fasta" type="list"> | 159 <collection name="genomic_cds" label="NCBI Genome Datasets: genomic cds fasta" type="list"> |
| 156 <discover_datasets pattern="(?P<identifier_0>.*?)\/cds_from_genomic\.(?P<ext>fasta(\.gz)?)$" directory="ncbi_dataset/data" recurse="true" match_relative_path="true"/> | 160 <discover_datasets pattern="(?P<identifier_0>.*?)\/cds_from_genomic\.(?P<ext>fasta(\.gz)?)$" directory="ncbi_dataset/data/" recurse="true" match_relative_path="true"/> |
| 157 <filter>file_choices['include'] and "cds" in file_choices['include']</filter> | 161 <filter>file_choices['include'] and "cds" in file_choices['include']</filter> |
| 158 </collection> | 162 </collection> |
| 159 <collection name="genomic_gff" label="NCBI Genome Datasets: genomic gff3" type="list"> | 163 <collection name="genomic_gff" label="NCBI Genome Datasets: genomic gff3" type="list"> |
| 160 <discover_datasets pattern="(?P<identifier_0>.*?)\/genomic\.gff" ext="gff3" directory="ncbi_dataset/data" recurse="true" match_relative_path="true"/> | 164 <discover_datasets pattern="(?P<identifier_0>.*?)\/genomic\.gff" ext="gff3" directory="ncbi_dataset/data/" recurse="true" match_relative_path="true"/> |
| 161 <filter>file_choices['include'] and "gff3" in file_choices['include']</filter> | 165 <filter>file_choices['include'] and "gff3" in file_choices['include']</filter> |
| 162 </collection> | 166 </collection> |
| 163 <collection name="genomic_gtf" label="NCBI Genome Datasets: gtf" type="list"> | 167 <collection name="genomic_gtf" label="NCBI Genome Datasets: gtf" type="list"> |
| 164 <discover_datasets pattern="(?P<identifier_0>.*?)\/genomic\.gtf" ext="gtf" directory="ncbi_dataset/data" recurse="true" match_relative_path="true"/> | 168 <discover_datasets pattern="(?P<identifier_0>.*?)\/genomic\.gtf" ext="gtf" directory="ncbi_dataset/data/" recurse="true" match_relative_path="true"/> |
| 165 <filter>file_choices['include'] and "gtf" in file_choices['include']</filter> | 169 <filter>file_choices['include'] and "gtf" in file_choices['include']</filter> |
| 166 </collection> | 170 </collection> |
| 167 <collection name="genomic_gbff" label="NCBI Genome Datasets: GenBank flatfile" type="list"> | 171 <collection name="genomic_gbff" label="NCBI Genome Datasets: GenBank flatfile" type="list"> |
| 168 <discover_datasets pattern="(?P<identifier_0>.*?)\/genomic\.gbff" ext="txt" directory="ncbi_dataset/data" recurse="true" match_relative_path="true"/> | 172 <discover_datasets pattern="(?P<identifier_0>.*?)\/genomic\.gbff" ext="txt" directory="ncbi_dataset/data/" recurse="true" match_relative_path="true"/> |
| 169 <filter>file_choices['include'] and "gbff" in file_choices['include']</filter> | 173 <filter>file_choices['include'] and "gbff" in file_choices['include']</filter> |
| 170 </collection> | 174 </collection> |
| 171 </outputs> | 175 </outputs> |
| 172 <tests> | 176 <tests> |
| 173 <test expect_num_outputs="3"> | 177 <test expect_num_outputs="3"> |
| 174 <conditional name="query|subcommand"> | 178 <conditional name="query|subcommand"> |
| 175 <param name="download_by" value="taxon"/> | 179 <param name="download_by" value="taxon"/> |
| 176 <param name="taxon_positional" value="human"/> | 180 <param name="taxon_positional" value="human"/> |
| 177 </conditional> | 181 </conditional> |
| 178 <param name="chromosomes" value="21"/> | 182 <section name="filters"> |
| 179 <param name="released_before" value="01/01/2018"/> | 183 <param name="chromosomes" value="21"/> |
| 184 <param name="released_before" value="01/01/2018"/> | |
| 185 </section> | |
| 180 <section name="file_choices"> | 186 <section name="file_choices"> |
| 181 <!-- include a sequence (which should be downloaded as fasta.gz) | 187 <!-- include a sequence (which should be downloaded as fasta.gz) |
| 182 and one non-sequence (which should be decompressed) output --> | 188 and one non-sequence (which should be decompressed) output --> |
| 183 <param name="include" value="rna,gff3"/> | 189 <param name="include" value="rna,gff3"/> |
| 184 </section> | 190 </section> |
| 185 <output name="genome_data_report"> | 191 <output name="genome_data_report"> |
| 186 <assert_contents> | 192 <assert_contents> |
| 187 <has_text text="Assembly Accession	Assembly Name	Assembly Submitter	Organism Name"/> | 193 <has_text text="Assembly Accession	Assembly Name	Assembly Submitter	Organism Name"/> |
| 188 <has_n_lines n="142"/> | 194 <has_n_lines n="142"/> |
| 189 <has_n_columns n="4"/> | 195 <has_n_columns n="4"/> |
| 190 </assert_contents> | 196 </assert_contents> |
| 191 </output> | 197 </output> |
| 192 <output_collection name="rna_fasta" type="list" count="1"> | 198 <output_collection name="rna_fasta" type="list" count="2"> |
| 193 <element name="GCF_000306695.2" decompress="true"> | 199 <element name="GCF_000306695.2" decompress="true"> |
| 194 <assert_contents> | 200 <assert_contents> |
| 195 <has_text text=">"/> | 201 <has_text text=">"/> |
| 196 </assert_contents> | 202 </assert_contents> |
| 197 </element> | 203 </element> |
| 198 </output_collection> | 204 </output_collection> |
| 199 <output_collection name="genomic_gff" type="list"> | 205 <output_collection name="genomic_gff" type="list" count="12"> |
| 200 <element name="GCF_000306695.2"> | 206 <element name="GCF_000306695.2"> |
| 201 <assert_contents> | 207 <assert_contents> |
| 202 <has_n_lines min="1000000"/> | 208 <has_n_lines min="1000000"/> |
| 203 <has_line line="##gff-version 3"/> | 209 <has_line line="##gff-version 3"/> |
| 204 <has_n_columns n="9" comment="#"/> | 210 <has_n_columns n="9" comment="#"/> |
| 212 <test expect_num_outputs="2"> | 218 <test expect_num_outputs="2"> |
| 213 <conditional name="query|subcommand"> | 219 <conditional name="query|subcommand"> |
| 214 <param name="download_by" value="taxon"/> | 220 <param name="download_by" value="taxon"/> |
| 215 <param name="taxon_positional" value="human"/> | 221 <param name="taxon_positional" value="human"/> |
| 216 </conditional> | 222 </conditional> |
| 217 <param name="chromosomes" value="21"/> | 223 <section name="filters"> |
| 218 <param name="assembly_level" value="chromosome,complete"/> | 224 <param name="chromosomes" value="21"/> |
| 219 <param name="released_before" value="01/01/2018"/> | 225 <param name="assembly_level" value="chromosome,complete"/> |
| 226 <param name="released_before" value="01/01/2018"/> | |
| 227 </section> | |
| 220 <section name="file_choices"> | 228 <section name="file_choices"> |
| 221 <param name="include" value="genome"/> | 229 <param name="include" value="genome"/> |
| 222 <param name="decompress" value="true"/> | 230 <param name="decompress" value="true"/> |
| 223 </section> | 231 </section> |
| 224 <output_collection name="genome_fasta" type="list:list" count="12"> | 232 <output_collection name="genome_fasta" type="list:list" count="11"> |
| 225 <expand macro="genome_fasta_assert" el1="GCA_000002115.2" el2="chr21" expression=">"/> | 233 <expand macro="genome_fasta_assert" el1="GCA_000002115.2" el2="chr21" expression=">"/> |
| 226 <expand macro="genome_fasta_assert" el1="GCA_000002125.2" el2="chr21" expression=">"/> | 234 <expand macro="genome_fasta_assert" el1="GCA_000002125.2" el2="chr21" expression=">"/> |
| 227 <expand macro="genome_fasta_assert" el1="GCA_000212995.1" el2="chr21" expression=">"/> | 235 <expand macro="genome_fasta_assert" el1="GCA_000212995.1" el2="chr21" expression=">"/> |
| 228 <expand macro="genome_fasta_assert" el1="GCA_000252825.1" el2="chr21" expression=">"/> | 236 <expand macro="genome_fasta_assert" el1="GCA_000306695.2" el2="chr21" expression=">"/> |
| 229 <expand macro="genome_fasta_assert" el1="GCA_000306695.2" el2="chr21" expression=">"/> | 237 <expand macro="genome_fasta_assert" el1="GCA_000365445.1" el2="chr21" expression=">"/> |
| 230 <expand macro="genome_fasta_assert" el1="GCA_000365445.1" el2="chr21" expression=">"/> | 238 <expand macro="genome_fasta_assert" el1="GCA_001292825.2" el2="chr21" expression=">"/> |
| 231 <expand macro="genome_fasta_assert" el1="GCA_001292825.2" el2="chr21" expression=">"/> | 239 <expand macro="genome_fasta_assert" el1="GCA_001524155.4" el2="chr21" expression=">"/> |
| 232 <expand macro="genome_fasta_assert" el1="GCA_001524155.4" el2="chr21" expression=">"/> | 240 <expand macro="genome_fasta_assert" el1="GCA_001712695.1" el2="chr21" expression=">"/> |
| 233 <expand macro="genome_fasta_assert" el1="GCA_001712695.1" el2="chr21" expression=">"/> | 241 <expand macro="genome_fasta_assert" el1="GCA_022833125.2" el2="chr21" expression=">"/> |
| 234 <expand macro="genome_fasta_assert" el1="GCA_022833125.2" el2="chr21" expression=">"/> | 242 <expand macro="genome_fasta_assert" el1="GCF_000002125.1" el2="chr21" expression=">"/> |
| 235 <expand macro="genome_fasta_assert" el1="GCF_000002125.1" el2="chr21" expression=">"/> | 243 <expand macro="genome_fasta_assert" el1="GCF_000306695.2" el2="chr21" expression=">"/> |
| 236 <expand macro="genome_fasta_assert" el1="GCF_000306695.2" el2="chr21" expression=">"/> | |
| 237 <!-- According to https://github.com/ncbi/datasets/issues/188, the following should not be included among the returned results anymore 09/2023 --> | 244 <!-- According to https://github.com/ncbi/datasets/issues/188, the following should not be included among the returned results anymore 09/2023 --> |
| 238 <!-- | 245 <!-- |
| 239 <expand macro="genome_fasta_assert" el1="GCA_000442335.2" el2="GCA_000442335.2_LinearCen1.1_normalized" expression=">" expression_n="25"/> | 246 <expand macro="genome_fasta_assert" el1="GCA_000442335.2" el2="GCA_000442335.2_LinearCen1.1_normalized" expression=">" expression_n="25"/> |
| 240 <expand macro="genome_fasta_assert" el1="GCA_000002135.3" el2="GCA_000002135.3_CRA_TCAGchr7v2" expression=">"/> | 247 <expand macro="genome_fasta_assert" el1="GCA_000002135.3" el2="GCA_000002135.3_CRA_TCAGchr7v2" expression=">"/> |
| 241 --> | 248 --> |
| 251 <test expect_failure="true"> | 258 <test expect_failure="true"> |
| 252 <conditional name="query|subcommand"> | 259 <conditional name="query|subcommand"> |
| 253 <param name="download_by" value="taxon"/> | 260 <param name="download_by" value="taxon"/> |
| 254 <param name="taxon_positional" value="human"/> | 261 <param name="taxon_positional" value="human"/> |
| 255 </conditional> | 262 </conditional> |
| 256 <param name="chromosomes" value="21"/> | 263 <section name="filters"> |
| 257 <param name="assembly_level" value="chromosome,complete"/> | 264 <param name="chromosomes" value="21"/> |
| 258 <param name="assembly_source" value="refseq"/> | 265 <param name="assembly_level" value="chromosome,complete"/> |
| 259 <param name="released_before" value="01/01/2018"/> | 266 <param name="assembly_source" value="refseq"/> |
| 267 <param name="released_before" value="01/01/2018"/> | |
| 268 </section> | |
| 260 <section name="file_choices"> | 269 <section name="file_choices"> |
| 261 <param name="include" value="genome"/> | 270 <param name="include" value="genome"/> |
| 262 <param name="decompress" value="true"/> | 271 <param name="decompress" value="true"/> |
| 263 </section> | 272 </section> |
| 264 <assert_stderr> | 273 <assert_stderr> |
| 286 <conditional name="text_or_file"> | 295 <conditional name="text_or_file"> |
| 287 <param name="text_or_file" value="text"/> | 296 <param name="text_or_file" value="text"/> |
| 288 <param name="accession" value="GCF_000013305.1 GCF_000007445.1"/> | 297 <param name="accession" value="GCF_000013305.1 GCF_000007445.1"/> |
| 289 </conditional> | 298 </conditional> |
| 290 </conditional> | 299 </conditional> |
| 291 <param name="released_before" value="01/01/2007"/> | 300 <section name="filters"> |
| 301 <param name="released_before" value="01/01/2007"/> | |
| 302 </section> | |
| 292 <section name="file_choices"> | 303 <section name="file_choices"> |
| 293 <param name="include" value="seq-report,gtf,cds"/> | 304 <param name="include" value="seq-report,gtf,cds"/> |
| 294 <param name="decompress" value="true"/> | 305 <param name="decompress" value="true"/> |
| 295 </section> | 306 </section> |
| 296 <output name="genome_data_report"> | 307 <output name="genome_data_report"> |
| 298 <has_text text="GCF_000013305.1"/> | 309 <has_text text="GCF_000013305.1"/> |
| 299 <has_n_lines n="3"/> | 310 <has_n_lines n="3"/> |
| 300 <has_n_columns n="4"/> | 311 <has_n_columns n="4"/> |
| 301 </assert_contents> | 312 </assert_contents> |
| 302 </output> | 313 </output> |
| 303 <output_collection name="sequence_report" type="list" count="2" > | 314 <output_collection name="sequence_report" type="list" count="2"> |
| 304 <element name="GCF_000007445.1"> | 315 <element name="GCF_000007445.1"> |
| 305 <assert_contents> | 316 <assert_contents> |
| 306 <has_text text="GCF_000007445.1"/> | 317 <has_text text="GCF_000007445.1"/> |
| 307 <has_n_lines n="2"/> | 318 <has_n_lines n="2"/> |
| 308 <has_n_columns n="15"/> | 319 <has_n_columns n="15"/> |
| 314 <has_n_lines n="2"/> | 325 <has_n_lines n="2"/> |
| 315 <has_n_columns n="15"/> | 326 <has_n_columns n="15"/> |
| 316 </assert_contents> | 327 </assert_contents> |
| 317 </element> | 328 </element> |
| 318 </output_collection> | 329 </output_collection> |
| 319 <output_collection name="genomic_gtf" type="list"> | 330 <output_collection name="genomic_gtf" type="list" count="2"> |
| 320 <element name="GCF_000007445.1" file="GCF_000007445.1.genomic.gtf" compare="contains"/> | 331 <element name="GCF_000007445.1" file="GCF_000007445.1.genomic.gtf" compare="contains"/> |
| 321 <element name="GCF_000013305.1" file="genome.2.GCF_000013305.1.genomic.gtf" compare="contains"/> | 332 <element name="GCF_000013305.1" file="genome.2.GCF_000013305.1.genomic.gtf" compare="contains"/> |
| 322 </output_collection> | 333 </output_collection> |
| 323 <output_collection name="genomic_cds" type="list"> | 334 <output_collection name="genomic_cds" type="list"> |
| 324 <element name="GCF_000007445.1" file="genome.2.GCF_000007445.1.genomic.cds" compare="contains"/> | 335 <element name="GCF_000007445.1" file="genome.2.GCF_000007445.1.genomic.cds" compare="contains"/> |
| 331 <conditional name="text_or_file"> | 342 <conditional name="text_or_file"> |
| 332 <param name="text_or_file" value="file"/> | 343 <param name="text_or_file" value="file"/> |
| 333 <param name="inputfile" value="accessions.txt"/> | 344 <param name="inputfile" value="accessions.txt"/> |
| 334 </conditional> | 345 </conditional> |
| 335 </conditional> | 346 </conditional> |
| 336 <param name="released_before" value="01/01/2007"/> | 347 <section name="filters"> |
| 348 <param name="released_before" value="01/01/2007"/> | |
| 349 </section> | |
| 337 <section name="file_choices"> | 350 <section name="file_choices"> |
| 338 <param name="include" value="seq-report,gff3,gbff"/> | 351 <param name="include" value="seq-report,gff3,gbff"/> |
| 339 <param name="decompress" value="true"/> | 352 <param name="decompress" value="true"/> |
| 340 </section> | 353 </section> |
| 341 <output name="genome_data_report"> | 354 <output name="genome_data_report"> |
| 353 <output_collection name="genomic_gbff" type="list"> | 366 <output_collection name="genomic_gbff" type="list"> |
| 354 <element name="GCF_000007445.1" file="genome.3.GCF_000007445.1.genomic.gbff" compare="contains"/> | 367 <element name="GCF_000007445.1" file="genome.3.GCF_000007445.1.genomic.gbff" compare="contains"/> |
| 355 <element name="GCF_000013305.1" file="genome.3.GCF_000013305.1.genomic.gbff" compare="contains"/> | 368 <element name="GCF_000013305.1" file="genome.3.GCF_000013305.1.genomic.gbff" compare="contains"/> |
| 356 </output_collection> | 369 </output_collection> |
| 357 </test> | 370 </test> |
| 358 | |
| 359 <!-- should not fail https://github.com/ncbi/datasets/issues/194 --> | 371 <!-- should not fail https://github.com/ncbi/datasets/issues/194 --> |
| 360 <test expect_num_outputs="2"> | 372 <test expect_num_outputs="2"> |
| 361 <conditional name="query|subcommand"> | 373 <conditional name="query|subcommand"> |
| 362 <param name="download_by" value="accession"/> | 374 <param name="download_by" value="accession"/> |
| 363 <conditional name="text_or_file"> | 375 <conditional name="text_or_file"> |
| 364 <param name="text_or_file" value="text"/> | 376 <param name="text_or_file" value="text"/> |
| 365 <param name="accession" value="GCF_000001405"/> | 377 <param name="accession" value="GCF_000001405"/> |
| 366 </conditional> | 378 </conditional> |
| 367 </conditional> | 379 </conditional> |
| 368 <param name="released_before" value="01/01/2015"/> | 380 <section name="filters"> |
| 369 <param name="assembly_version" value="all"/> | 381 <param name="released_before" value="01/01/2015"/> |
| 382 <param name="assembly_version" value="all"/> | |
| 383 </section> | |
| 370 <section name="file_choices"> | 384 <section name="file_choices"> |
| 371 <param name="include" value="seq-report"/> | 385 <param name="include" value="seq-report"/> |
| 372 </section> | 386 </section> |
| 373 <output name="genome_data_report"> | 387 <output name="genome_data_report"> |
| 374 <!-- assert that we get at least the 16 versions available at the time of writing this test --> | 388 <!-- assert that we get at least the 16 versions available at the time of writing this test --> |
| 393 <section name="file_choices"> | 407 <section name="file_choices"> |
| 394 <param name="include" value="genome,protein,rna,cds"/> | 408 <param name="include" value="genome,protein,rna,cds"/> |
| 395 <param name="decompress" value="true"/> | 409 <param name="decompress" value="true"/> |
| 396 </section> | 410 </section> |
| 397 <output_collection name="genome_fasta" type="list:list" count="1"> | 411 <output_collection name="genome_fasta" type="list:list" count="1"> |
| 398 <expand macro="genome_fasta_assert" el1="GCF_000146045.2" el2="GCF_000146045.2_R64" expression=">NC_[0-9]+\.[0-9]+ Saccharomyces cerevisiae S288[Cc] (mitochondrion|chromosome .*), complete (sequence|genome)" expression_n="17"/> | 412 <expand macro="genome_fasta_assert" el1="GCF_000146045.2" el2="GCF_000146045.2_R64" expression=">NC_[0-9]+\.[0-9]+ Saccharomyces cerevisiae S288[Cc] (mitochondrion|chromosome .*), complete (sequence|genome)" expression_n="17"/> |
| 399 </output_collection> | 413 </output_collection> |
| 400 <output_collection name="protein_fasta" type="list" count="1"> | 414 <output_collection name="protein_fasta" type="list" count="1"> |
| 401 <element name="GCF_000146045.2" decompress="true"> | 415 <element name="GCF_000146045.2" decompress="true"> |
| 402 <assert_contents> | 416 <assert_contents> |
| 403 <has_text text=">"/> | 417 <has_text text=">"/> |
| 404 </assert_contents> | 418 </assert_contents> |
| 405 </element> | 419 </element> |
| 406 </output_collection> | 420 </output_collection> |
| 407 <output_collection name="rna_fasta" type="list" count="1"> | 421 <output_collection name="rna_fasta" type="list" count="1"> |
| 408 <element name="GCF_000146045.2" decompress="true"> | 422 <element name="GCF_000146045.2" decompress="true"> |
| 409 <assert_contents> | 423 <assert_contents> |
| 410 <has_text text=">"/> | 424 <has_text text=">"/> |
| 411 </assert_contents> | 425 </assert_contents> |
| 412 </element> | 426 </element> |
| 413 </output_collection> | 427 </output_collection> |
| 414 </test> | 428 </test> |
| 415 <!-- same as the previous test, but use the default value for decompress, | 429 <!-- same as the previous test, but use the default value for decompress, |
| 435 </element> | 449 </element> |
| 436 </output_collection> | 450 </output_collection> |
| 437 <output_collection name="protein_fasta" type="list" count="1"> | 451 <output_collection name="protein_fasta" type="list" count="1"> |
| 438 <element name="GCF_000146045.2" ftype="fasta.gz"> | 452 <element name="GCF_000146045.2" ftype="fasta.gz"> |
| 439 <assert_contents> | 453 <assert_contents> |
| 440 <has_size value="1845038" delta="2000"/> | 454 <has_size value="1847862" delta="2000"/> |
| 441 </assert_contents> | 455 </assert_contents> |
| 442 </element> | 456 </element> |
| 443 </output_collection> | 457 </output_collection> |
| 444 <output_collection name="rna_fasta" type="list" count="1"> | 458 <output_collection name="rna_fasta" type="list" count="1"> |
| 445 <element name="GCF_000146045.2" ftype="fasta.gz"> | 459 <element name="GCF_000146045.2" ftype="fasta.gz"> |
| 461 <param name="include" value="seq-report,genome"/> | 475 <param name="include" value="seq-report,genome"/> |
| 462 <param name="decompress" value="true"/> | 476 <param name="decompress" value="true"/> |
| 463 </section> | 477 </section> |
| 464 <output_collection name="sequence_report" type="list" count="2"/> | 478 <output_collection name="sequence_report" type="list" count="2"/> |
| 465 <output_collection name="genome_fasta" type="list:list" count="2"> | 479 <output_collection name="genome_fasta" type="list:list" count="2"> |
| 466 <expand macro="genome_fasta_assert" el1="GCF_000002945.2" el2="GCF_000002945.2_ASM294v3" expression=">NC_[0-9]+\.[0-9]+ Schizosaccharomyces pombe.*" expression_n="4"/> | 480 <expand macro="genome_fasta_assert" el1="GCF_000002945.2" el2="GCF_000002945.2_ASM294v3" expression=">NC_[0-9]+\.[0-9]+ Schizosaccharomyces pombe.*" expression_n="4"/> |
| 467 <expand macro="genome_fasta_assert" el1="GCF_000146045.2" el2="GCF_000146045.2_R64" expression=">NC_[0-9]+\.[0-9]+ Saccharomyces cerevisiae S288[Cc].*" expression_n="17"/> | 481 <expand macro="genome_fasta_assert" el1="GCF_000146045.2" el2="GCF_000146045.2_R64" expression=">NC_[0-9]+\.[0-9]+ Saccharomyces cerevisiae S288[Cc].*" expression_n="17"/> |
| 468 </output_collection> | 482 </output_collection> |
| 469 </test> | 483 </test> |
| 470 <!-- tax_exact_match should filter out strains | 484 <!-- tax_exact_match should filter out strains |
| 471 https://github.com/ncbi/datasets/issues/187 --> | 485 https://github.com/ncbi/datasets/issues/187 --> |
| 472 <test expect_num_outputs="1"> | 486 <test expect_num_outputs="2"> |
| 473 <conditional name="query|subcommand"> | 487 <conditional name="query|subcommand"> |
| 474 <param name="download_by" value="taxon"/> | 488 <param name="download_by" value="taxon"/> |
| 475 <param name="taxon_positional" value="4932"/> | 489 <param name="taxon_positional" value="4932"/> |
| 476 <param name="tax_exact_match" value="true"/> | 490 <param name="tax_exact_match" value="true"/> |
| 477 </conditional> | 491 </conditional> |
| 478 <param name="include" value=""/> | 492 <output name="genome_data_report"> |
| 479 <output name="genome_data_report"> | 493 <assert_contents> |
| 480 <assert_contents> | 494 <has_text text="Saccharomyces cerevisiae ZTW1" negate="true"/> |
| 481 <has_text text="Saccharomyces cerevisiae ZTW1" negate="true"/> | |
| 482 </assert_contents> | 495 </assert_contents> |
| 483 </output> | 496 </output> |
| 484 </test> | 497 </test> |
| 485 </tests> | 498 </tests> |
| 486 <help> | 499 <help> |
