comparison data_manager/data_manager_mmseqs2_download.xml @ 0:75cc3fb4c10f draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/data_managers/data_manager_mmseqs2_database commit 1400593429eb4e9c6e307df3621825a8b84a6fa7
author iuc
date Thu, 27 Mar 2025 14:37:32 +0000
parents
children 35885ec2e59b
comparison
equal deleted inserted replaced
-1:000000000000 0:75cc3fb4c10f
1 <tool id="data_manager_mmseqs2_download" name="Download MMseqs2 databases" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" tool_type="manage_data" profile="22.05">
2 <description></description>
3 <macros>
4 <token name="@TOOL_VERSION@">15.6f452</token>
5 <token name="@VERSION_SUFFIX@">0</token>
6 </macros>
7 <requirements>
8 <requirement type="package" version="@TOOL_VERSION@">mmseqs2</requirement>
9 </requirements>
10 <command detect_errors="exit_code"><![CDATA[
11 #set $database_name = str($database).split('/')[-1] if '/' in str($database) else str($database)
12
13 mkdir -p '$out_file.extra_files_path'/'$database_name' &&
14 mmseqs databases
15 '$database' '$out_file.extra_files_path'/'$database_name'/database
16 'tmp'
17 --threads "\${GALAXY_SLOTS:-1}" &&
18 cp '$dmjson' '$out_file'
19 ]]></command>
20 <configfiles>
21 <configfile name="dmjson"><![CDATA[
22 #from datetime import date
23 #set $database_name = str($database).split('/')[-1] if '/' in str($database) else str($database)
24 {
25 "data_tables":{
26 "mmseqs2_databases":[
27 {
28 "value": "${database}-@TOOL_VERSION@-#echo date.today().strftime('%d%m%Y')#",
29 "name": "${database} #echo date.today().strftime('%d%m%Y')#",
30 "type": "${db_type}",
31 "taxonomy": "${db_taxonomy}",
32 "path": "$database_name",
33 "version": "@TOOL_VERSION@"
34 }
35 ]
36 }
37 }]]>
38 </configfile>
39 </configfiles>
40 <inputs>
41 <conditional name="db_name">
42 <param argument="type" type="select" label="Type of Databases">
43 <option value="aminoacid">Aminoacid databases</option>
44 <option value="aminoacid_taxonomy">Aminoacid databases that can be used for taxonomy</option>
45 <option value="nucleotide">Nucleotide databases</option>
46 <option value="nucleotide_taxonomy">Nucleotide databases that can be used for taxonomy</option>
47 <option value="profile">Profile databases</option>
48 </param>
49 <when value="aminoacid">
50 <param name="db_type" value="aminoacid" type="hidden"/>
51 <param name="db_taxonomy" value="no" type="hidden"/>
52 <param name="database" type="select" label="MMseqs2 aminoacid databases">
53 <option value="UniRef100" selected="true">UniRef100</option>
54 <option value="UniRef90">UniRef90</option>
55 <option value="UniRef50">UniRef50</option>
56 <option value="UniProtKB">UniProtKB</option>
57 <option value="UniProtKB/TrEMBL">TrEMBL (UniProtKB)</option>
58 <option value="UniProtKB/Swiss-Prot">Swiss-Prot (UniProtKB)</option>
59 <option value="NR">NR (Non-redundant protein sequences from GenPept, Swissprot, PIR, PDF, PDB, and NCBI RefSeq)</option>
60 <option value="GTDB">GTDB (Genome Taxonomy Database)</option>
61 <option value="PDB">PDB (The Protein Data Bank)</option>
62 </param>
63 </when>
64 <when value="aminoacid_taxonomy">
65 <param name="db_type" value="aminoacid" type="hidden"/>
66 <param name="db_taxonomy" value="yes" type="hidden"/>
67 <param name="database" type="select" label="MMseqs2 aminoacid databases that can be used for taxonomy">
68 <option value="UniRef100" selected="true">UniRef100</option>
69 <option value="UniRef90">UniRef90</option>
70 <option value="UniRef50">UniRef50</option>
71 <option value="UniProtKB">UniProtKB</option>
72 <option value="UniProtKB/TrEMBL">TrEMBL (UniProtKB)</option>
73 <option value="UniProtKB/Swiss-Prot">Swiss-Prot (UniProtKB)</option>
74 <option value="NR">NR (Non-redundant protein sequences from GenPept, Swissprot, PIR, PDF, PDB, and NCBI RefSeq)</option>
75 <option value="GTDB">GTDB (Genome Taxonomy Database)</option>
76 </param>
77 </when>
78 <when value="nucleotide">
79 <param name="db_type" value="nucleotide" type="hidden"/>
80 <param name="db_taxonomy" value="no" type="hidden"/>
81 <param name="database" type="select" label="MMseqs2 nucleotide databases">
82 <option value="SILVA">SILVA</option>
83 <option value="Kalamari">Kalamari</option>
84 <option value="NT">NT (Partially non-redundant nucleotide sequences from all traditional divisions of GenBank, EMBL, and DDBJ excluding GSS, STS, PAT, EST, HTG, and WGS)</option>
85 <option value="Resfinder">Resfinder</option>
86 </param>
87 </when>
88 <when value="nucleotide_taxonomy">
89 <param name="db_type" value="nucleotide" type="hidden"/>
90 <param name="db_taxonomy" value="yes" type="hidden"/>
91 <param name="database" type="select" label="MMseqs2 nucleotide databases that can be used for taxonomy">
92 <option value="SILVA">SILVA</option>
93 <option value="Kalamari">Kalamari</option>
94 </param>
95 </when>
96 <when value="profile">
97 <param name="db_type" value="profile" type="hidden"/>
98 <param name="db_taxonomy" value="no" type="hidden"/>
99 <param name="database" type="select" label="MMseqs2 profile databases">
100 <option value="PDB70">PDB70 (PDB clustered to 70% sequence identity)</option>
101 <option value="Pfam-A.full">Pfam-A.full</option>
102 <option value="Pfam-A.seed">Pfam-A.seed</option>
103 <option value="Pfam-B">Pfam-B</option>
104 <option value="CDD">CDD (Conserved Domain Database)</option>
105 <option value="VOGDB">VOGDB (Virus Orthologous Groups)</option>
106 <option value="dbCAN2">dbCAN2 (database of carbohydrate-active enzymes)</option>
107 </param>
108 </when>
109 </conditional>
110 </inputs>
111 <outputs>
112 <data name="out_file" format="data_manager_json" label="${tool.name}"/>
113 </outputs>
114 <tests>
115 <test expect_num_outputs="1">
116 <conditional name="db_name">
117 <param name="type" value="nucleotide_taxonomy" />
118 <param name="db_type" value="nucleotide" />
119 <param name="db_taxonomy" value="yes" />
120 <param name="database" value="SILVA" />
121 </conditional>
122 <output name="out_file">
123 <assert_contents>
124 <has_text text='"mmseqs2_databases":'/>
125 <has_text text='"version": "15.6f452"'/>
126 <has_text_matching expression='"value": "SILVA-15.6f452-[0-9]{8}"'/>
127 <has_text_matching expression='"name": "SILVA [0-9]{8}"'/>
128 <has_text text='"type": "nucleotide"'/>
129 <has_text text='"taxonomy": "yes"'/>
130 <has_text text='"path": "SILVA"'/>
131 </assert_contents>
132 </output>
133 </test>
134 <test expect_num_outputs="1">
135 <conditional name="db_name">
136 <param name="type" value="aminoacid_taxonomy" />
137 <param name="db_type" value="aminoacid" />
138 <param name="db_taxonomy" value="yes" />
139 <param name="database" value="UniProtKB/Swiss-Prot" />
140 </conditional>
141 <output name="out_file">
142 <assert_contents>
143 <has_text text='"mmseqs2_databases":'/>
144 <has_text text='"version": "15.6f452"'/>
145 <has_text_matching expression='"value": "UniProtKB/Swiss-Prot-15.6f452-[0-9]{8}"'/>
146 <has_text_matching expression='"name": "UniProtKB/Swiss-Prot [0-9]{8}"'/>
147 <has_text text='"type": "aminoacid"'/>
148 <has_text text='"taxonomy": "yes"'/>
149 <has_text text='"path": "Swiss-Prot"'/>
150 </assert_contents>
151 </output>
152 </test>
153 </tests>
154 <help><![CDATA[
155 This tool downloads databases that can be used with MMseqs2.
156 ]]></help>
157 <citations>
158 <citation type="doi">10.1038/nbt.3988</citation>
159 </citations>
160 </tool>