Mercurial > repos > devteam > data_manager_fetch_ncbi_taxonomy
comparison data_manager/ncbi_taxonomy_fetcher.xml @ 8:2649aece3781 draft default tip
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/main/data_managers/data_manager_fetch_ncbi_taxonomy commit cf8607692417bdc4f663c726aea34c1056dd9c48
| author | iuc |
|---|---|
| date | Mon, 17 Nov 2025 21:47:03 +0000 |
| parents | 34a5799a65fa |
| children |
comparison
equal
deleted
inserted
replaced
| 7:34a5799a65fa | 8:2649aece3781 |
|---|---|
| 1 <?xml version="1.0"?> | 1 <tool id="ncbi_taxonomy_fetcher" name="NCBI" tool_type="manage_data" version="1.1" profile="24.0"> |
| 2 <tool id="ncbi_taxonomy_fetcher" name="NCBI" tool_type="manage_data" version="1.0.4" profile="23.0"> | |
| 3 <description>taxonomy downloader</description> | 2 <description>taxonomy downloader</description> |
| 4 <requirements> | 3 <requirements> |
| 5 <requirement type="package" version="3.7">python</requirement> | 4 <requirement type="package" version="1.25.0">wget</requirement> |
| 6 </requirements> | 5 </requirements> |
| 7 <command detect_errors="exit_code"> | 6 <command detect_errors="exit_code"> |
| 8 <![CDATA[ | 7 <![CDATA[ |
| 9 python '$__tool_directory__/data_manager.py' --out '${out_file}' | 8 set -o pipefail; |
| 10 #if $taxonomy_url: | 9 |
| 11 --url '${taxonomy_url}' | 10 mkdir -p '$out_file.extra_files_path/taxonomy/' && |
| 11 wget -O - '$taxonomy_url' | tar -xz -C '$out_file.extra_files_path/taxonomy/' && | |
| 12 if [[ ! -f '$out_file.extra_files_path/taxonomy/nodes.dmp' ]]; then >&2 echo "nodes.dmp missing"; exit 1; fi && | |
| 13 | |
| 14 #if $name_maps | |
| 15 mkdir -p '$out_file.extra_files_path/accession2taxid/' && | |
| 16 #if $partial_data | |
| 17 #set files = ['pdb.accession2taxid'] | |
| 18 #else | |
| 19 #set files = ['dead_nucl.accession2taxid', 'dead_prot.accession2taxid', 'dead_wgs.accession2taxid', 'nucl_gb.accession2taxid', 'nucl_wgs.accession2taxid', 'pdb.accession2taxid', 'prot.accession2taxid', 'prot.accession2taxid.FULL'] | |
| 20 #end if | |
| 21 #for file in files | |
| 22 wget -O - ftp://ftp.ncbi.nlm.nih.gov/pub/taxonomy/accession2taxid/${file}.gz | gunzip -c > '$out_file.extra_files_path/accession2taxid/${file}' && | |
| 23 #end for | |
| 12 #end if | 24 #end if |
| 13 #if $database_name: | 25 cp '$dmjson' '$out_file' |
| 14 --name '${database_name}' | |
| 15 #end if | |
| 16 $name_maps | |
| 17 $partial_data | |
| 18 ]]> | 26 ]]> |
| 19 </command> | 27 </command> |
| 28 <configfiles> | |
| 29 <configfile name="dmjson"><![CDATA[#slurp | |
| 30 #if $database_name == "" | |
| 31 #import datetime | |
| 32 #import os.path | |
| 33 #set now = datetime.datetime.now().strftime("%Y-%m-%d-%H%M%S") | |
| 34 #set basename = os.path.basename(str($taxonomy_url))[:-7] | |
| 35 #set value = basename + "_" + now | |
| 36 #set name = basename + " " + now | |
| 37 #else | |
| 38 #set value = $database_name.lower() | |
| 39 #set name = $database_name | |
| 40 #end if | |
| 41 { | |
| 42 "data_tables":{ | |
| 43 "ncbi_taxonomy":[ | |
| 44 { | |
| 45 "value": "$value", | |
| 46 "name": "$name", | |
| 47 "path": "." | |
| 48 } | |
| 49 ] | |
| 50 #if $name_maps | |
| 51 ,"ncbi_accession2taxid":[ | |
| 52 { | |
| 53 "value": "$value", | |
| 54 "name": "$name", | |
| 55 "path": "." | |
| 56 } | |
| 57 ] | |
| 58 #end if | |
| 59 } | |
| 60 }]]></configfile> | |
| 61 </configfiles> | |
| 20 <inputs> | 62 <inputs> |
| 21 <param name="database_name" type="text" optional="true" label="Name for this database" help="Enter a unique identifier, or leave blank for today's date" /> | 63 <param name="database_name" type="text" label="Name for this database" help="Enter a unique identifier, or leave blank for today's date" /> |
| 22 <param name="taxonomy_url" type="text" value='ftp://ftp.ncbi.nih.gov/pub/taxonomy/taxdump.tar.gz' label="Enter URL for taxonomy files" /> | 64 <param name="taxonomy_url" type="text" value='ftp://ftp.ncbi.nih.gov/pub/taxonomy/taxdump.tar.gz' label="Enter URL for taxonomy files" /> |
| 23 <param name="name_maps" type="boolean" truevalue="--name-maps" falsevalue="" label="Also download accession2taxid data" checked="false" /> | 65 <param name="name_maps" type="boolean" label="Also download accession2taxid data" checked="false" /> |
| 24 <param name="partial_data" type="hidden" value="" help="Used for testing"/> | 66 <param name="partial_data" type="hidden" value="" help="Used for testing"/> |
| 25 </inputs> | 67 </inputs> |
| 26 <outputs> | 68 <outputs> |
| 27 <data name="out_file" format="data_manager_json" /> | 69 <data name="out_file" format="data_manager_json" /> |
| 28 </outputs> | 70 </outputs> |
| 29 <tests> | 71 <tests> |
| 30 <test> | 72 <test> |
| 31 <param name="database_name" value="tax_name"/> | 73 <param name="database_name" value="tax_name"/> |
| 32 <output name="out_file" value="taxonomy.json"/> | 74 <output name="out_file" value="taxonomy.json"/> |
| 75 </test> | |
| 76 <test> | |
| 77 <output name="out_file"> | |
| 78 <assert_contents> | |
| 79 <has_text_matching expression='"value": "taxdump_\d\d\d\d-\d\d-\d\d-\d\d\d\d\d\d"'/> | |
| 80 <has_text_matching expression='"name": "taxdump \d\d\d\d-\d\d-\d\d-\d\d\d\d\d\d"'/> | |
| 81 </assert_contents> | |
| 82 </output> | |
| 33 </test> | 83 </test> |
| 34 <test> | 84 <test> |
| 35 <param name="database_name" value="tax_name"/> | 85 <param name="database_name" value="tax_name"/> |
| 36 <param name="name_maps" value="true"/> | 86 <param name="name_maps" value="true"/> |
| 37 <param name="partial_data" value="--partial"/> | 87 <param name="partial_data" value="--partial"/> |
