2
|
1 <tool id="dbbuilder" version="0.2.0" name="Protein Database Downloader">
|
0
|
2 <description>
|
|
3 </description>
|
|
4 <requirements>
|
|
5 <requirement type="binary">wget</requirement>
|
|
6 </requirements>
|
|
7 <stdio>
|
2
|
8 <exit_code range="1:" level="fatal" description="Error downloading database." />
|
|
9 <regex match="ERROR" level="fatal" source="stderr" description="Error downloading database." />
|
0
|
10 </stdio>
|
2
|
11 <!-- TODO: escape quotes. -->
|
|
12 <!-- Add NCBI and maxquant contaminants. -->
|
|
13 <!-- http://maxquant.org/contaminants.zip -->
|
|
14 <!-- ftp://ftp.ncbi.nih.gov/refseq/H_sapiens/mRNA_Prot/human.protein.faa.gz-->
|
0
|
15 <command>
|
|
16 #if $source.from == "uniprot"
|
2
|
17 #set $url = "http://www.uniprot.org/uniprot/?query=taxonomy%3a%22" + str($source.taxon) + "%22" + str($source.set) + str($source.reviewed) + "&force=yes&format=fasta" + str($source.include_isoform)
|
|
18 #set $type = "direct"
|
0
|
19 #elif $source.from == "cRAP"
|
|
20 #set $url = "ftp://ftp.thegpm.org/fasta/cRAP/crap.fasta"
|
2
|
21 #set $type = "direct"
|
|
22 #elif $source.from == "url"
|
|
23 #set $url = $source.url
|
|
24 #set $type = "direct"
|
0
|
25 #end if
|
2
|
26 #if $type =="direct"
|
0
|
27 wget -nv '$url' -O '${output_database}'
|
2
|
28 #end if
|
0
|
29 </command>
|
|
30 <inputs>
|
|
31 <conditional name="source">
|
3
|
32 <param name="from" type="select" label="Download from" help="select database source. cRAP acts as a database for common MS contaminants. UniProtKB is a corss species collection of functional protein databases">
|
0
|
33 <option value="uniprot">UniProtKB</option>
|
|
34 <option value="cRAP">cRAP (contaminants)</option>
|
2
|
35 <option value="url">Custom URL</option>
|
0
|
36 </param>
|
|
37 <when value="uniprot">
|
3
|
38 <param name="taxon" type="select" format="text" help="select species for protein database">
|
0
|
39 <label>Taxonomy</label>
|
|
40 <options from_file="uniprot_taxons.loc">
|
|
41 <column name="name" index="0" />
|
|
42 <column name="value" index="1" />
|
|
43 </options>
|
|
44 </param>
|
3
|
45 <param name="reviewed" type="select" help="UniProtKB/TrEMBL (unreviewed)is a large, automatically annotated database- may contain redundant sequences, but there is a higher chance peptides will be identified. UniProtKB/Swiss-Prot (reviewed) is a smaller, manually annotated database- less of a chance peptides will be identified but less sequence redundancy">
|
2
|
46 <option value="+">UniProtKB</option>
|
|
47 <option value="+reviewed%3Ayes">UniProtKB/Swiss-Prot (reviewed only)</option>
|
|
48 <option value="+reviewed%3Ano">UniProtKB/TrEMBL (unreviewed only)</option>
|
|
49 <sanitizer>
|
|
50 <valid>
|
|
51 <add value="%"/>
|
|
52 </valid>
|
|
53 </sanitizer>
|
|
54 </param>
|
|
55 <param name="set" type="select" label="Proteome Set">
|
|
56 <option value="+">Any</option>
|
|
57 <option value="+keyword%3a1185" selected="true">Reference Proteome Set</option>
|
|
58 <option value="+keyword%3a181">Complete Proteome Set</option>
|
|
59 <sanitizer>
|
|
60 <valid>
|
|
61 <add value="%"/>
|
|
62 </valid>
|
|
63 </sanitizer>
|
|
64 </param>
|
3
|
65 <param name="include_isoform" type="boolean" truevalue="&include=yes" falsevalue="" label="Include isoform data" help="several different forms of a given protein are incorporated into database" />
|
0
|
66 </when>
|
2
|
67 <when value="cRAP" />
|
|
68 <when value="url">
|
|
69 <param name="url" value="" type="text" label="URL (http, ftp)">
|
|
70 <sanitizer>
|
|
71 <valid>
|
|
72 <add value="%"/>
|
|
73 </valid>
|
|
74 </sanitizer>
|
|
75 </param>
|
|
76 </when>
|
0
|
77 </conditional>
|
|
78 </inputs>
|
|
79 <outputs>
|
|
80 <data format="fasta" name="output_database" label="Protein Database" />
|
|
81 </outputs>
|
|
82 <help>
|
|
83 **Output**
|
|
84
|
3
|
85 Creates a FASTA file of specified protein sequences for comparison with experimental MS/MS data in search algorithm.
|
|
86
|
|
87 **External Links**
|
0
|
88
|
3
|
89 _Galaxy-P 101 shows usage Protein Database Downloader tool in the creation of a workflow
|
|
90 .. _Galaxy-P 101: http://msi-galaxy-p.readthedocs.org/en/latest/sections/galaxyp_101.html
|
|
91 _UniProtKB provides additional information about the UniProt Knowledgebase
|
|
92 .. _UniProtKB: http://www.uniprot.org/help/uniprotkb
|
0
|
93 </help>
|
|
94 </tool>
|
|
95
|