annotate unipept.xml @ 1:0c1ee95282fa draft

Uploaded
author galaxyp
date Tue, 14 Apr 2015 16:44:22 -0400
parents 6430407e5869
children 503ab8a39006
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
1 <tool id="unipept" name="Unipept" version="1.1.0">
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
2 <description>retrieve taxonomy for peptides</description>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
3 <macros>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
4 <xml name="equate_il">
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
5 <param name="equate_il" type="boolean" truevalue="-e" falsevalue="" checked="true" label="Equate isoleucine and leucine">
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
6 <help>isoleucine (I) and leucine (L) are equated when matching tryptic peptides to UniProt records</help>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
7 </param >
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
8 </xml>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
9 <xml name="extra">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
10 <param name="extra" type="boolean" truevalue="-x" falsevalue="" checked="false" label="retrieve extra information">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
11 <yield/>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
12 </param >
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
13 </xml>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
14 <xml name="names">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
15 <param name="names" type="boolean" truevalue="-n" falsevalue="" checked="true" label="names" >
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
16 <help>return the names in complete taxonomic lineage</help>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
17 </param >
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
18 <param name="allfields" type="boolean" truevalue="-A" falsevalue="" checked="false" label="allfields" >
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
19 <help>include fields for most specific taxonomic classification: taxon_rank,taxon_id,taxon_name before lineage</help>
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
20 </param >
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
21 </xml>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
22 </macros>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
23 <requirements>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
24 </requirements>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
25 <stdio>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
26 <exit_code range="1:" />
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
27 </stdio>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
28 <command interpreter="python"><![CDATA[
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
29 unipept.py
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
30 --api=$unipept.api
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
31 $unipept.equate_il $unipept.extra
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
32 #if $unipept.api != 'pept2prot':
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
33 $unipept.names $unipept.allfields
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
34 #end if
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
35 $strict
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
36 #if str($peptide_src.fmt) == 'proteomic':
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
37 #if $peptide_src.input.datatype.file_ext == 'fasta':
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
38 --fasta="$peptide_src.input"
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
39 #elif $peptide_src.input.datatype.file_ext == 'mzid':
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
40 --mzid="$peptide_src.input"
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
41 #elif $peptide_src.input.datatype.file_ext == 'pepxml':
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
42 --pepxml="$peptide_src.input"
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
43 #end if
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
44 #elif str($peptide_src.fmt) == 'tabular':
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
45 --tabular="$peptide_src.input_tsv"
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
46 #set $col = int(str($peptide_src.column)) - 1
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
47 --column=$col
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
48 #elif str($peptide_src.fmt) == 'fasta':
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
49 --fasta="$peptide_src.input_fasta"
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
50 #elif str($peptide_src.fmt) == 'mzid':
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
51 --mzid="$peptide_src.input_mzid"
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
52 #elif str($peptide_src.fmt) == 'pepxml':
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
53 --pepxml="$peptide_src.input_pepxml"
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
54 #end if
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
55 #if 'json' in str($outputs).split(','):
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
56 --json $output_json
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
57 #end if
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
58 #if 'tsv' in str($outputs).split(','):
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
59 --tsv $output_tsv
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
60 #end if
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
61 #if 'csv' in str($outputs).split(','):
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
62 --csv $output_csv
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
63 #end if
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
64 #if 'unmatched' in str($outputs).split(','):
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
65 --unmatched $output_unmatched
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
66 #end if
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
67 ]]></command>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
68 <inputs>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
69 <conditional name="unipept">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
70 <param name="api" type="select" label="Unipept application" >
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
71 <option value="pept2lca" selected="true">pept2lca: lowest common ancestor</option>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
72 <option value="pept2taxa">pept2taxa: organisms associated with the UniProt entries containing a given tryptic peptide</option>
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
73 <option value="pept2prot">pept2prot: UniProt entries containing a given tryptic peptide</option>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
74 </param>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
75 <when value="pept2lca">
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
76 <expand macro="equate_il" />
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
77 <expand macro="extra">
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
78 <help>Return the complete lineage of the taxonomic lowest common ancestor, and include ID fields.</help>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
79 </expand>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
80 <expand macro="names" />
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
81 </when>
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
82 <when value="pept2taxa">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
83 <expand macro="equate_il" />
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
84 <expand macro="extra">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
85 <checked>true</checked>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
86 <help>Return the complete lineage of each organism, and include ID fields.</help>
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
87 </expand>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
88 <expand macro="names" />
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
89 </when>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
90 <when value="pept2prot">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
91 <expand macro="equate_il" />
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
92 <expand macro="extra">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
93 <help>Return additional information fields: taxon_name, ec_references, go_references, refseq_ids, refseq_protein_ids, insdc_ids, insdc_protein_ids
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
94 WARNING: Huge perfomance penalty! Only use for small number of peptides when the extra infomation is required.
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
95 </help>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
96 </expand>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
97 </when>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
98 </conditional>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
99 <conditional name="peptide_src">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
100 <param name="fmt" type="select" label="Peptides input format" >
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
101 <option value="proteomic">proteomics formats: mzid, pepxml, fasta</option>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
102 <option value="tabular">tabular</option>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
103 <option value="fasta">fasta</option>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
104 <option value="mzid">mzid</option>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
105 <option value="pepxml">pepxml</option>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
106 </param>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
107 <when value="proteomic">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
108 <param name="input" type="data" format="mzid,pepxml,fasta" label="Peptide Input" />
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
109 </when>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
110 <when value="tabular">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
111 <param name="input_tsv" type="data" format="tabular" label="Tabular Input Containing Peptide column" />
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
112 <param name="column" label="Select column with peptides" type="data_column" numerical="false" data_ref="input_tsv" />
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
113 </when>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
114 <when value="fasta">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
115 <param name="input_fasta" type="data" format="fasta" label="Peptide Fasta Input" />
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
116 </when>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
117 <when value="mzid">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
118 <param name="input_mzid" type="data" format="mzid" label="mzIndetML Input" />
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
119 </when>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
120 <when value="pepxml">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
121 <param name="input_pepxml" type="data" format="pepxml" label="mzIndetML Input" />
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
122 </when>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
123 </conditional>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
124 <param name="outputs" type="select" multiple="true" display="checkboxes" label="Choose outputs">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
125 <option value="tsv" selected="true">tabular</option>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
126 <option value="csv">Comma Separated Values (.csv)</option>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
127 <option value="json">JSON</option>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
128 <option value="unmatched">Unmatched peptides</option>
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
129 </param>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
130 <param name="strict" type="boolean" truevalue="--strict" falsevalue="" checked="false" label="Exit with error on invalid peptides, otherwise ignore them"/>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
131 </inputs>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
132 <outputs>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
133 <data name="output_json" format="json" label="${tool.name} ${unipept.api} on ${on_string} json">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
134 <filter>'json' in outputs</filter>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
135 </data>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
136 <data name="output_tsv" format="tabular" label="${tool.name} ${unipept.api} on ${on_string} tsv">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
137 <filter>'tsv' in outputs</filter>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
138 </data>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
139 <data name="output_csv" format="csv" label="${tool.name} ${unipept.api} on ${on_string} csv">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
140 <filter>'csv' in outputs</filter>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
141 </data>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
142 <data name="output_unmatched" format="tabular" label="${tool.name} ${unipept.api} on ${on_string} unmatched">
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
143 <filter>'unmatched' in outputs</filter>
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
144 </data>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
145 </outputs>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
146 <tests>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
147 <test>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
148 <param name="api" value="pept2lca"/>
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
149 <param name="fmt" value="tabular"/>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
150 <param name="input_tsv" value="tryptic.tsv"/>
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
151 <param name="column" value="2"/>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
152 <param name="extra" value="True"/>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
153 <param name="names" value="True"/>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
154 <param name="outputs" value="tsv,unmatched"/>
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
155 <output name="output_tsv">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
156 <assert_contents>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
157 <has_text text="Homininae" />
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
158 </assert_contents>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
159 </output>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
160 <output name="output_unmatched">
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
161 <assert_contents>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
162 <has_text text="QTAMAV" />
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
163 </assert_contents>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
164 </output>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
165 </test>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
166 <test>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
167 <param name="api" value="pept2lca"/>
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
168 <param name="fmt" value="fasta"/>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
169 <param name="input_fasta" value="peptide.fa"/>
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
170 <param name="equate_il" value="True"/>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
171 <param name="extra" value="True"/>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
172 <param name="names" value="True"/>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
173 <param name="outputs" value="json,tsv"/>
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
174 <output name="output_json">
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
175 <assert_contents>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
176 <has_text text="VMDVNDHKPEFYNCSLPACTFTPEEAQVNFTGYVDEHASPHIPIDDLTMVVYDPDKGSNGTFLLSLGGPDAEAFSVSPERAAGSASVQVLVRVSALVDYERQTAMAV" />
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
177 </assert_contents>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
178 </output>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
179 <output name="output_tsv">
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
180 <assert_contents>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
181 <has_text text="9606" />
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
182 <has_text text="9598" />
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
183 </assert_contents>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
184 </output>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
185 </test>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
186 <test>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
187 <param name="api" value="pept2taxa"/>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
188 <param name="fmt" value="fasta"/>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
189 <param name="input_fasta" value="peptide.fa"/>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
190 <param name="equate_il" value="True"/>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
191 <param name="extra" value="False"/>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
192 <param name="names" value="False"/>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
193 <param name="outputs" value="tsv"/>
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
194 <output name="output_tsv">
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
195 <assert_contents>
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
196 <has_text text="sapiens" />
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
197 <has_text text="troglodytes" />
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
198 <has_text text="Gorilla" />
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
199 <has_text text="Macaca" />
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
200 </assert_contents>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
201 </output>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
202 </test>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
203 </tests>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
204 <help><![CDATA[
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
205 **Unipept**
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
206
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
207 Retrieve Uniprot and taxanomic information for trypic peptides.
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
208
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
209 Unipept API documentation - http://unipept.ugent.be/apidocs
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
210
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
211 **Input**
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
212
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
213 Input peptides can be retrieved from tabular, fasta, mzid, or pepxml datasets.
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
214
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
215 Processing deatils::
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
216
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
217 The input peptides are split into typtic peptide fragments in order to match the Unipept records.
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
218 Only fragments that are complete tryptic peptides between 5 and 50 animo acid in length will be matched by Unipept.
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
219 The match to the most specific tryptic fragment is reported.
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
220
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
221
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
222 **Unipept APIs**
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
223
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
224 **pept2prot** - http://unipept.ugent.be/apidocs/pept2prot
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
225
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
226 Returns the list of UniProt entries containing a given tryptic peptide. This is the same information as provided on the Protein matches tab when performing a search with the Tryptic Peptide Analysis in the web interface.
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
227
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
228 By default, each object contains the following information fields extracted from the UniProt record::
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
229
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
230 peptide: the peptide that matched this record
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
231 uniprot_id: the UniProt accession number of the matching record
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
232 taxon_id: the NCBI taxon id of the organism associated with the matching record
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
233
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
234 When the extra parameter is set to true, objects contain the following additional fields extracted from the UniProt record::
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
235
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
236 taxon_name: the name of the organism associated with the matching UniProt record
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
237 ec_references: a space separated list of associated EC numbers
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
238 go_references: a space separated list of associated GO terms
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
239 refseq_ids: a space separated list of associated RefSeq accession numbers
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
240 refseq_protein_ids: a space separated list of associated RefSeq protein accession numbers
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
241 insdc_ids: a space separated list of associated insdc accession numbers
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
242 insdc_protein_ids: a space separated list of associated insdc protein accession numbers
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
243
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
244
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
245 **pept2taxa** - http://unipept.ugent.be/apidocs/pept2taxa
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
246
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
247 Returns the set of organisms associated with the UniProt entries containing a given tryptic peptide. This is the same information as provided on the Lineage table tab when performing a search with the Tryptic Peptide Analysis in the web interface.
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
248
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
249 By default, each object contains the following information fields extracted from the UniProt record and NCBI taxonomy::
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
250
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
251 peptide: the peptide that matched this record
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
252 taxon_id: the NCBI taxon id of the organism associated with the matching record
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
253 taxon_name: the name of the organism associated with the matching record
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
254 taxon_rank: the taxonomic rank of the organism associated with the matching record
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
255
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
256 When the extra parameter is set to true, objects contain additional information about the lineages of the organism extracted from the NCBI taxonomy. The taxon id of each rank in the lineage is specified using the following information fields::
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
257
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
258 superkingdom_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
259 kingdom_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
260 subkingdom_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
261 superphylum_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
262 phylum_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
263 subphylum_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
264 superclass_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
265 class_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
266 subclass_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
267 infraclass_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
268 superorder_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
269 order_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
270 suborder_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
271 infraorder_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
272 parvorder_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
273 superfamily_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
274 family_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
275 subfamily_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
276 tribe_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
277 subtribe_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
278 genus_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
279 subgenus_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
280 species_group_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
281 species_subgroup_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
282 species_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
283 subspecies_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
284 varietas_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
285 forma_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
286
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
287
1
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
288 **pept2lca** - http://unipept.ugent.be/apidocs/pept2lca
0c1ee95282fa Uploaded
galaxyp
parents: 0
diff changeset
289
0
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
290 Returns the taxonomic lowest common ancestor for a given tryptic peptide. This is the same information as provided when performing a search with the Tryptic Peptide Analysis in the web interface.
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
291
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
292 By default, each object contains the following information fields extracted from the UniProt record and NCBI taxonomy::
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
293
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
294 peptide: the peptide that matched this record
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
295 taxon_id: the NCBI taxon id of the organism associated with the matching record
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
296 taxon_name: the name of the organism associated with the matching record
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
297 taxon_rank: the taxonomic rank of the organism associated with the matching record
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
298
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
299 When the extra parameter is set to true, objects contain additional information about the lineage of the taxonomic lowest common ancestor extracted from the NCBI taxonomy. The taxon id of each rank in the lineage is specified using the following information fields::
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
300
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
301 superkingdom_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
302 kingdom_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
303 subkingdom_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
304 superphylum_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
305 phylum_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
306 subphylum_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
307 superclass_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
308 class_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
309 subclass_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
310 infraclass_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
311 superorder_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
312 order_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
313 suborder_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
314 infraorder_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
315 parvorder_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
316 superfamily_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
317 family_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
318 subfamily_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
319 tribe_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
320 subtribe_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
321 genus_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
322 subgenus_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
323 species_group_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
324 species_subgroup_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
325 species_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
326 subspecies_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
327 varietas_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
328 forma_id
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
329
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
330
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
331 **Attributions**
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
332
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
333 The Unipept metaproteomics analysis pipeline
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
334 Bart Mesuere1,*, Griet Debyser2, Maarten Aerts3, Bart Devreese2, Peter Vandamme3 andPeter Dawyndt1
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
335 Article first published online: 11 FEB 2015
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
336 DOI: 10.1002/pmic.201400361
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
337 http://onlinelibrary.wiley.com/doi/10.1002/pmic.201400361/abstract;jsessionid=BFF1994E4C14DA73D7C907EB208AD710.f04t04
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
338
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
339 ]]></help>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
340 <citations>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
341 <citation type="doi">doi:10.1002/pmic.201400361</citation>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
342 </citations>
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
343
6430407e5869 Uploaded
galaxyp
parents:
diff changeset
344 </tool>