annotate protein_prophet.xml @ 12:4c66453a168e draft

Uploaded
author iracooke
date Mon, 16 Jun 2014 07:17:09 -0400
parents
children d90c8bc10a9c
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
12
4c66453a168e Uploaded
iracooke
parents:
diff changeset
1 <tool id="proteomics_search_protein_prophet_1" name="Protein Prophet" version="1.0.1">
4c66453a168e Uploaded
iracooke
parents:
diff changeset
2 <requirements>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
3 <requirement type="package" version="1.3">protk</requirement>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
4 <requirement type="package" version="4.6.3">trans_proteomic_pipeline</requirement>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
5 </requirements>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
6
4c66453a168e Uploaded
iracooke
parents:
diff changeset
7 <description>Calculate Protein Prophet statistics on search results</description>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
8
4c66453a168e Uploaded
iracooke
parents:
diff changeset
9
4c66453a168e Uploaded
iracooke
parents:
diff changeset
10 <!-- Note .. the input file is assumed to be the first argument -->
4c66453a168e Uploaded
iracooke
parents:
diff changeset
11 <command>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
12 protein_prophet.rb
4c66453a168e Uploaded
iracooke
parents:
diff changeset
13
4c66453a168e Uploaded
iracooke
parents:
diff changeset
14 --galaxy $input_file
4c66453a168e Uploaded
iracooke
parents:
diff changeset
15
4c66453a168e Uploaded
iracooke
parents:
diff changeset
16 -o protein_prophet_results.prot.xml
4c66453a168e Uploaded
iracooke
parents:
diff changeset
17
4c66453a168e Uploaded
iracooke
parents:
diff changeset
18 -r
4c66453a168e Uploaded
iracooke
parents:
diff changeset
19
4c66453a168e Uploaded
iracooke
parents:
diff changeset
20 $iproph
4c66453a168e Uploaded
iracooke
parents:
diff changeset
21 $nooccam
4c66453a168e Uploaded
iracooke
parents:
diff changeset
22 $groupwts
4c66453a168e Uploaded
iracooke
parents:
diff changeset
23 $normprotlen
4c66453a168e Uploaded
iracooke
parents:
diff changeset
24 $logprobs
4c66453a168e Uploaded
iracooke
parents:
diff changeset
25 $confem
4c66453a168e Uploaded
iracooke
parents:
diff changeset
26 $allpeps
4c66453a168e Uploaded
iracooke
parents:
diff changeset
27 $unmapped
4c66453a168e Uploaded
iracooke
parents:
diff changeset
28 $instances
4c66453a168e Uploaded
iracooke
parents:
diff changeset
29 $delude
4c66453a168e Uploaded
iracooke
parents:
diff changeset
30
4c66453a168e Uploaded
iracooke
parents:
diff changeset
31 --minprob=$minprob
4c66453a168e Uploaded
iracooke
parents:
diff changeset
32 --minindep=$minindep
4c66453a168e Uploaded
iracooke
parents:
diff changeset
33 </command>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
34 <inputs>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
35
4c66453a168e Uploaded
iracooke
parents:
diff changeset
36 <param name="input_file" type="data" format="peptideprophet_pepxml,interprophet_pepxml" multiple="false" label="Peptide Prophet Results" help="These files will typically be outputs from peptide prophet or interprophet"/>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
37
4c66453a168e Uploaded
iracooke
parents:
diff changeset
38
4c66453a168e Uploaded
iracooke
parents:
diff changeset
39 <param name="iproph" checked="true" type="boolean" label="Inputs are from iProphet" truevalue="--iprophet-input" falsevalue=""/>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
40 <param name="nooccam" type="boolean" label="Don't apply Occam's razor" help="When selected no attempt will be made to derive the simplest protein list explaining observed peptides" truevalue="--no-occam" falsevalue=""/>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
41 <param name="groupwts" type="boolean" label="Use group weights" help="Check peptide's total weight (rather than actual weight) in the Protein Group against the threshold" truevalue="--group-wts" falsevalue=""/>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
42 <param name="normprotlen" type="boolean" label="Normalize NSP using Protein Length" truevalue="--norm-protlen" falsevalue=""/>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
43 <param name="logprobs" type="boolean" label="Use the log of probability in the confidence calculations" truevalue="--log-prob" falsevalue=""/>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
44 <param name="confem" type="boolean" label="Use the EM to compute probability given the confidence" truevalue="--confem" falsevalue=""/>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
45 <param name="allpeps" type="boolean" label="Consider all possible peptides in the database in the confidence model" truevalue="--allpeps" falsevalue=""/>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
46 <param name="unmapped" type="boolean" label="Report results for unmapped proteins" truevalue="--unmapped" falsevalue=""/>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
47 <param name="instances" type="boolean" label="Use Expected Number of Ion Instances to adjust the peptide probabilities prior to NSP adjustment" truevalue="--instances" falsevalue=""/>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
48 <param name="delude" type="boolean" label="Do NOT use peptide degeneracy information when assessing proteins" truevalue="--delude" falsevalue=""/>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
49
4c66453a168e Uploaded
iracooke
parents:
diff changeset
50 <param name="minprob" type="text" label="Minimum peptide prophet probability for peptides to be considered" value="0.05"/>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
51 <param name="minindep" type="text" label="Minimum percentage of independent peptides required for a protein" value="0"/>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
52
4c66453a168e Uploaded
iracooke
parents:
diff changeset
53 </inputs>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
54 <outputs>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
55 <data format="protxml" name="output" metadata_source="input_file" label="protein_prophet.${input_file.display_name}.protXML" from_work_dir="protein_prophet_results.prot.xml"/>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
56 </outputs>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
57
4c66453a168e Uploaded
iracooke
parents:
diff changeset
58
4c66453a168e Uploaded
iracooke
parents:
diff changeset
59 <!--NOPLOT: do not generate plot png file
4c66453a168e Uploaded
iracooke
parents:
diff changeset
60 NOOCCAM: non-conservative maximum protein list
4c66453a168e Uploaded
iracooke
parents:
diff changeset
61 GROUPWTS: check peptide's total weight in the Protein Group against the threshold (default: check peptide's actual weight against threshold)
4c66453a168e Uploaded
iracooke
parents:
diff changeset
62 NORMPROTLEN: Normalize NSP using Protein Length
4c66453a168e Uploaded
iracooke
parents:
diff changeset
63 LOGPROBS: Use the log of the probabilities in the Confidence calculations
4c66453a168e Uploaded
iracooke
parents:
diff changeset
64 CONFEM: Use the EM to compute probability given the confidence
4c66453a168e Uploaded
iracooke
parents:
diff changeset
65 ALLPEPS: Consider all possible peptides in the database in the confidence model
4c66453a168e Uploaded
iracooke
parents:
diff changeset
66 UNMAPPED: Report results for UNMAPPED proteins
4c66453a168e Uploaded
iracooke
parents:
diff changeset
67 INSTANCES: Use Expected Number of Ion Instances to adjust the peptide probabilities prior to NSP adjustment
4c66453a168e Uploaded
iracooke
parents:
diff changeset
68 DELUDE: do NOT use peptide degeneracy information when assessing proteins
4c66453a168e Uploaded
iracooke
parents:
diff changeset
69
4c66453a168e Uploaded
iracooke
parents:
diff changeset
70 MINPROB: peptideProphet probability threshold (default=0.05)
4c66453a168e Uploaded
iracooke
parents:
diff changeset
71 MININDEP: minimum percentage of independent peptides required for a protein (default=0)
4c66453a168e Uploaded
iracooke
parents:
diff changeset
72
4c66453a168e Uploaded
iracooke
parents:
diff changeset
73
4c66453a168e Uploaded
iracooke
parents:
diff changeset
74 -->
4c66453a168e Uploaded
iracooke
parents:
diff changeset
75
4c66453a168e Uploaded
iracooke
parents:
diff changeset
76 <help>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
77
4c66453a168e Uploaded
iracooke
parents:
diff changeset
78 **What it does**
4c66453a168e Uploaded
iracooke
parents:
diff changeset
79
4c66453a168e Uploaded
iracooke
parents:
diff changeset
80 Given a set of peptide assignments from MS/MS spectra in the form of a pepXML file, this tool estimates probabilities at the protein level. As output, the tool produces a protXML file, which contains proteins along with the estimated probabilities that those proteins were present. Probabilities are estimated using a statistical model based on the number of peptides corresponding to each protein and the confidence that each of those peptides was assigned correctly. It takes account of the fact that peptides may correspond to more than one protein.
4c66453a168e Uploaded
iracooke
parents:
diff changeset
81
4c66453a168e Uploaded
iracooke
parents:
diff changeset
82 ----
4c66453a168e Uploaded
iracooke
parents:
diff changeset
83
4c66453a168e Uploaded
iracooke
parents:
diff changeset
84 **Citation**
4c66453a168e Uploaded
iracooke
parents:
diff changeset
85
4c66453a168e Uploaded
iracooke
parents:
diff changeset
86 If you use this tool, please read and cite the paper describing the statistical model implemented by Protein Prophet:
4c66453a168e Uploaded
iracooke
parents:
diff changeset
87
4c66453a168e Uploaded
iracooke
parents:
diff changeset
88 Nesvizhskii A., et al. “A Statistical Model for Identifying Proteins by Tandem Mass Spectrometry” *Anal. Chem.* 75, 4646-4658 (2003).
4c66453a168e Uploaded
iracooke
parents:
diff changeset
89
4c66453a168e Uploaded
iracooke
parents:
diff changeset
90
4c66453a168e Uploaded
iracooke
parents:
diff changeset
91 </help>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
92
4c66453a168e Uploaded
iracooke
parents:
diff changeset
93 </tool>