Mercurial > repos > galaxyp > dbbuilder
comparison dbbuilder.xml @ 8:a85fbebe8b2f draft
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/dbbuilder commit baa8095b41984515948c6ef2fda7c7e61c945f94
author | galaxyp |
---|---|
date | Wed, 03 May 2017 09:53:17 -0400 |
parents | a94dc3d469cb |
children | c1b437242fee |
comparison
equal
deleted
inserted
replaced
7:a94dc3d469cb | 8:a85fbebe8b2f |
---|---|
1 <tool id="dbbuilder" name="Protein Database Downloader" version="0.2.1"> | 1 <tool id="dbbuilder" name="Protein Database Downloader" version="0.3.0"> |
2 <description></description> | 2 <description></description> |
3 <requirements> | 3 <requirements> |
4 <requirement type="package">gnu-wget</requirement> | 4 <requirement type="package">gnu-wget</requirement> |
5 </requirements> | 5 </requirements> |
6 <stdio> | 6 <stdio> |
18 #set $type = "direct" | 18 #set $type = "direct" |
19 #elif $source.from == "cRAP" | 19 #elif $source.from == "cRAP" |
20 ##set $url = "ftp://ftp.thegpm.org/fasta/cRAP/crap.fasta" | 20 ##set $url = "ftp://ftp.thegpm.org/fasta/cRAP/crap.fasta" |
21 #set $url = "https://raw.githubusercontent.com/pravs3683/cRAP/master/cRAP_protein_database.fasta" | 21 #set $url = "https://raw.githubusercontent.com/pravs3683/cRAP/master/cRAP_protein_database.fasta" |
22 #set $type = "direct" | 22 #set $type = "direct" |
23 #elif $source.from == "HMP" | |
24 #set $url = 'http://downloads.hmpdacc.org/data/reference_genomes/body_sites/' + str($source.site) + '.pep.fsa' | |
25 #set $type = "direct" | |
26 #elif $source.from == "HOMD" | |
27 #set $url = 'ftp://ftp.homd.org/human_oral_microbial_genomic_sequences/current/' + str($source.annotation) | |
28 #if str($source.annotation).endswith('.tar.gz'): | |
29 #set $type = "tgz" | |
30 #elif str($source.annotation).endswith('.zip'): | |
31 #set $type = "zip" | |
32 #end if | |
33 #elif $source.from == 'EBI Metagenomics' | |
34 #set $url = 'https://www.ebi.ac.uk/metagenomics/projects/' + str($source.ebi_project) + '/samples/' + str($source.ebi_sample) + '/runs/' + str($source.ebi_run) + '/results/versions/' + str($source.ebi_version) + '/sequences/' + str($source.ebi_annotation) + '/chunks/1' | |
35 #set $type = "gzip" | |
23 #elif $source.from == "url" | 36 #elif $source.from == "url" |
24 #set $url = $source.url | 37 #set $url = $source.url |
25 #set $type = "direct" | 38 #set $type = $source.archive_type |
26 #end if | 39 #end if |
27 #if $type =="direct" | 40 #if $type =="direct" |
28 wget -nv '$url' -O '${output_database}' | 41 wget -nv '$url' -O '${output_database}' --no-check-certificate |
42 #elif $type =="zip" | |
43 wget -nv '$url' -O tmp.zip --no-check-certificate && zcat -c tmp.zip > '${output_database}' | |
44 #elif $type =="gzip" | |
45 wget -nv '$url' -O tmp.gz --no-check-certificate && (if `command -v gzcat > /dev/null`; then gzcat tmp.gz; else zcat tmp.gz ; fi) > '${output_database}' | |
46 #elif $type =="bzip2" | |
47 wget -nv '$url' -O tmp.bz2 --no-check-certificate && bzcat tmp.bz2 > '${output_database}' | |
48 #elif $type =="tgz" | |
49 wget -nv '$url' -O tmp.tar.gz && tar zxfO tmp.tar.gz > '${output_database}' | |
50 #elif $type =="tbz" | |
51 wget -nv '$url' -O tmp.tar.bz && tar jxfO tmp.tar.bz > '${output_database}' | |
29 #end if | 52 #end if |
30 ]]> | 53 ]]> |
31 </command> | 54 </command> |
32 <inputs> | 55 <inputs> |
33 <conditional name="source"> | 56 <conditional name="source"> |
34 <param name="from" type="select" label="Download from" help="Select database source. cRAP acts as a database for common MS contaminants. UniProtKB is a corss species collection of functional protein databases"> | 57 <param name="from" type="select" label="Download from" help="Select database source. cRAP acts as a database for common MS contaminants. UniProtKB is a cross species collection of functional protein databases"> |
35 <option value="uniprot">UniProtKB</option> | 58 <option value="uniprot">UniProtKB</option> |
36 <option value="cRAP">cRAP (contaminants)</option> | 59 <option value="cRAP">cRAP (contaminants)</option> |
60 <option value="HMP">Human Microbiome Project body sites</option> | |
61 <option value="EBI Metagenomics">EBI Metagenomics</option> | |
62 <option value="HOMD">Human Oral Microbiome Database (HOMD)</option> | |
37 <option value="url">Custom URL</option> | 63 <option value="url">Custom URL</option> |
38 </param> | 64 </param> |
39 <when value="uniprot"> | 65 <when value="uniprot"> |
40 <param name="taxon" type="select" format="text" help="select species for protein database"> | 66 <param name="taxon" type="select" format="text" help="select species for protein database"> |
41 <label>Taxonomy</label> | 67 <label>Taxonomy</label> |
65 </sanitizer> | 91 </sanitizer> |
66 </param> | 92 </param> |
67 <param name="include_isoform" type="boolean" truevalue="&include=yes" falsevalue="" label="Include isoform data" help="several different forms of a given protein are incorporated into database" /> | 93 <param name="include_isoform" type="boolean" truevalue="&include=yes" falsevalue="" label="Include isoform data" help="several different forms of a given protein are incorporated into database" /> |
68 </when> | 94 </when> |
69 <when value="cRAP" /> | 95 <when value="cRAP" /> |
96 <when value="HMP"> | |
97 <param name="site" type="select" label="Proteome for body site"> | |
98 <option value="Airways">HMP airways</option> | |
99 <option value="Blood">HMP Blood</option> | |
100 <option value="Gastrointestinal_tract">HMP Gastro-intestinal tract</option> | |
101 <option value="Oral">HMP Oral</option> | |
102 <option value="Skin">HMP Skin</option> | |
103 <option value="Urogenital_tract">HMP urogenital Tract</option> | |
104 </param> | |
105 </when> | |
106 <when value="EBI Metagenomics"> | |
107 <param name="ebi_project" value="" type="text" label="EBI Metagenomics Project (e.g. DRP003095)"> | |
108 <help><![CDATA[ | |
109 Look up EBI Metagenomics at https://www.ebi.ac.uk/metagenomics/search | |
110 ]]></help> | |
111 </param> | |
112 <param name="ebi_sample" value="" type="text" label="EBI Metagenomics Sample (e.g. DRS029200)"> | |
113 </param> | |
114 <param name="ebi_run" value="" type="text" label="EBI Metagenomics Run (e.g. DRR033743)"> | |
115 </param> | |
116 <param name="ebi_version" value="" type="text" label="EBI Metagenomics Pipeline Version (e.g. 3.0)"> | |
117 </param> | |
118 <param name="ebi_annotation" type="boolean" label="With Annotation" checked="true" | |
119 truevalue="PredictedCDSWithAnnotation" falsevalue="PredictedCDSWithioutAnnotation"/> | |
120 | |
121 </when> | |
122 <when value="HOMD"> | |
123 <param name="annotation" type="select" label="Human Oral Microbiome Proteome"> | |
124 <option value="oral_microbiome_dynamic.aa.zip">HOMD with dynamic annotation</option> | |
125 <option value="oral_microbiome.aa.tar.gz">HOMD with static annotation</option> | |
126 </param> | |
127 </when> | |
70 <when value="url"> | 128 <when value="url"> |
71 <param name="url" value="" type="text" label="URL (http, ftp)"> | 129 <param name="url" value="" type="text" label="URL (http, ftp) of Fasta sequences"> |
72 <sanitizer> | 130 <sanitizer> |
73 <valid> | 131 <valid> |
74 <add value="%"/> | 132 <add value="%"/> |
133 <add value="~"/> | |
75 </valid> | 134 </valid> |
76 </sanitizer> | 135 </sanitizer> |
136 </param> | |
137 <param name="archive_type" type="select" label="Fasta source compression type"> | |
138 <option value="direct" selected="true">fasta file (uncompressed)</option> | |
139 <option value="gzip">fasta.gz (gzip compressed)</option> | |
140 <option value="bzip2">fasta.bz2 (bzip2 compressed)</option> | |
141 <option value="zip">fasta.zip or fasta.Z (Zip compressed)</option> | |
142 <option value="tgz">fasta.tgz or fasta.tar.gz (tar archive gzip compressed)</option> | |
143 <option value="tbz">fasta.tbz or fasta.tar.bz (tar archive bzip2 compressed)</option> | |
77 </param> | 144 </param> |
78 </when> | 145 </when> |
79 </conditional> | 146 </conditional> |
80 </inputs> | 147 </inputs> |
81 <outputs> | 148 <outputs> |
82 <data format="fasta" name="output_database" label="Protein Database" /> | 149 <data format="fasta" name="output_database" label="Protein Database ${source.from}" /> |
83 </outputs> | 150 </outputs> |
84 <tests> | 151 <tests> |
85 <test> | 152 <test> |
86 <param name="from" value="cRAP" /> | 153 <param name="from" value="cRAP" /> |
87 <output name="output_database"> | 154 <output name="output_database"> |
88 <assert_contents> | 155 <assert_contents> |
89 <has_text text="KKA1_ECOLX" /> | 156 <has_text text="KKA1_ECOLX" /> |
90 </assert_contents> | 157 </assert_contents> |
91 </output> | 158 </output> |
92 </test> | 159 </test> |
160 <test> | |
161 <param name="from" value="url" /> | |
162 <param name="url" value="https://raw.githubusercontent.com/pravs3683/cRAP/master/cRAP_protein_database.fasta" /> | |
163 <param name="archive_type" value="direct" /> | |
164 <output name="output_database"> | |
165 <assert_contents> | |
166 <has_text text="KKA1_ECOLX" /> | |
167 </assert_contents> | |
168 </output> | |
169 </test> | |
170 <test> | |
171 <param name="from" value="EBI Metagenomics" /> | |
172 <param name="ebi_project" value="DRP003095" /> | |
173 <param name="ebi_sample" value="DRS029200" /> | |
174 <param name="ebi_run" value="DRR033743" /> | |
175 <param name="ebi_version" value="3.0" /> | |
176 <output name="output_database"> | |
177 <assert_contents> | |
178 <has_text text="DRR033743" /> | |
179 </assert_contents> | |
180 </output> | |
181 </test> | |
93 </tests> | 182 </tests> |
94 <help> | 183 <help> |
95 <![CDATA[ | 184 <![CDATA[ |
96 **Output** | 185 **Output** |
97 | 186 |
98 Creates a FASTA file of specified protein sequences for comparison with experimental MS/MS data in search algorithm. | 187 Creates a FASTA file of specified protein sequences for comparison with experimental MS/MS data in search algorithm. |
99 | 188 |
100 **External Links** | 189 **External Links** |
101 | 190 |
102 _Galaxy-P 101 shows usage Protein Database Downloader tool in the creation of a workflow | 191 - Galaxy-P_101_ shows usage Protein Database Downloader tool in the creation of a workflow |
103 .. _Galaxy-P 101: http://msi-galaxy-p.readthedocs.org/en/latest/sections/galaxyp_101.html | 192 - UniProtKB_ provides additional information about the UniProt Knowledgebase |
104 _UniProtKB provides additional information about the UniProt Knowledgebase | 193 |
194 | |
195 .. _Galaxy-P_101: http://msi-galaxy-p.readthedocs.org/en/latest/sections/galaxyp_101.html | |
105 .. _UniProtKB: http://www.uniprot.org/help/uniprotkb | 196 .. _UniProtKB: http://www.uniprot.org/help/uniprotkb |
197 | |
198 | |
199 **Additional Protein Fasta URLs** | |
200 | |
201 *HUMAN GUT METAPROTEOME:* | |
202 | |
203 * 512MB gzip ftp://public.genomics.org.cn/BGI/gutmeta/UniSet/UniGene.pep.gz | |
204 * 61MB gzip http://www.bork.embl.de/~arumugam/Qin_et_al_2010/frequent_microbe_proteins.fasta.gz | |
205 | |
206 | |
207 *MOUSE GUT MICROBIOTA:* | |
208 | |
209 * 417MB gzip ftp://climb.genomics.cn/pub/10.5524/100001_101000/100114/Genecatalog/184sample_2.6M.GeneSet.pep.gz | |
210 * See: http://gigadb.org/dataset/view/id/100114/token/mZlMYJIF04LshpgP | |
211 | |
212 | |
106 ]]> | 213 ]]> |
107 </help> | 214 </help> |
215 <citations> | |
216 <citation type="doi">10.1093/nar/gkw1099</citation> | |
217 <citation type="doi">10.1093/nar/gkv1195 </citation> | |
218 <citation type="doi">10.1093/database/baq013</citation> | |
219 <citation type="doi">10.1038/nature11209</citation> | |
220 <citation type="doi">10.1038/nature11234</citation> | |
221 </citations> | |
108 </tool> | 222 </tool> |
109 | 223 |