annotate peptide_prophet.xml @ 12:4c66453a168e draft

Uploaded
author iracooke
date Mon, 16 Jun 2014 07:17:09 -0400
parents
children b793fe628648
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
12
4c66453a168e Uploaded
iracooke
parents:
diff changeset
1 <tool id="proteomics_search_peptide_prophet_1" name="Peptide Prophet" version="1.0.1">
4c66453a168e Uploaded
iracooke
parents:
diff changeset
2 <requirements>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
3 <requirement type="package" version="1.3">protk</requirement>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
4 <requirement type="package" version="4.6.3">trans_proteomic_pipeline</requirement>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
5 </requirements>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
6
4c66453a168e Uploaded
iracooke
parents:
diff changeset
7 <description>Calculate Peptide Prophet statistics on search results</description>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
8
4c66453a168e Uploaded
iracooke
parents:
diff changeset
9 <command>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
10 peptide_prophet.rb --galaxy $input_file -o peptide_prophet_output.pep.xml
4c66453a168e Uploaded
iracooke
parents:
diff changeset
11
4c66453a168e Uploaded
iracooke
parents:
diff changeset
12 -r
4c66453a168e Uploaded
iracooke
parents:
diff changeset
13 $glyco
4c66453a168e Uploaded
iracooke
parents:
diff changeset
14 $useicat
4c66453a168e Uploaded
iracooke
parents:
diff changeset
15 $phospho
4c66453a168e Uploaded
iracooke
parents:
diff changeset
16 $usepi
4c66453a168e Uploaded
iracooke
parents:
diff changeset
17 $usert
4c66453a168e Uploaded
iracooke
parents:
diff changeset
18 $accurate_mass
4c66453a168e Uploaded
iracooke
parents:
diff changeset
19 $no_ntt
4c66453a168e Uploaded
iracooke
parents:
diff changeset
20 $no_nmc
4c66453a168e Uploaded
iracooke
parents:
diff changeset
21 $use_gamma
4c66453a168e Uploaded
iracooke
parents:
diff changeset
22 $use_only_expect
4c66453a168e Uploaded
iracooke
parents:
diff changeset
23 $force_fit
4c66453a168e Uploaded
iracooke
parents:
diff changeset
24 $allow_alt_instruments
4c66453a168e Uploaded
iracooke
parents:
diff changeset
25 $maldi
4c66453a168e Uploaded
iracooke
parents:
diff changeset
26
4c66453a168e Uploaded
iracooke
parents:
diff changeset
27 </command>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
28
4c66453a168e Uploaded
iracooke
parents:
diff changeset
29 <inputs>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
30
4c66453a168e Uploaded
iracooke
parents:
diff changeset
31 <param name="input_file" type="data" format="raw_pepxml" multiple="false" label="Raw Search Results" help="These files will typically be outputs from omssa or xtandem search tools"/>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
32
4c66453a168e Uploaded
iracooke
parents:
diff changeset
33 <param name="glyco" type="boolean" label="Expect true positives to have a glycocapture motif" truevalue="--glyco" falsevalue=""/>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
34 <param name="useicat" type="boolean" label="Use icat information" truevalue="--useicat" falsevalue="--no-useicat"/>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
35 <param name="phospho" type="boolean" label="Use phospho information" truevalue="--phospho" falsevalue=""/>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
36 <param name="usepi" type="boolean" label="Use pI information" truevalue="--usepi" falsevalue=""/>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
37 <param name="usert" type="boolean" label="Use hydrophobicity / RT information" truevalue="--usert" falsevalue=""/>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
38 <param name="accurate_mass" type="boolean" label="Use accurate mass binning" truevalue="--accurate-mass" falsevalue=""/>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
39 <param name="no_ntt" type="boolean" label="Don't use NTT model" truevalue="--no-ntt" falsevalue=""/>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
40 <param name="no_nmc" type="boolean" label="Don't use NMC model" truevalue="--no-nmc" falsevalue=""/>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
41 <param name="use_gamma" type="boolean" label="Use Gamma distribution to model the negatives" help="Applies only to X!Tandem results" truevalue="--usegamma" falsevalue=""/>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
42 <param name="use_only_expect" type="boolean" label="Only use Expect Score as the discriminant" help="Applies only to X!Tandem results.
4c66453a168e Uploaded
iracooke
parents:
diff changeset
43 Helpful for data with homologous top hits e.g. phospho or glyco" truevalue="--use-only-expect" falsevalue=""/>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
44 <param name="force_fit" type="boolean" label="Force fitting" help="Bypasses automatic mixture model checks and forces fitting of a mixture model" truevalue="--force-fit" falsevalue=""/>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
45 <param name="allow_alt_instruments" type="boolean" label="Allow multiple instrument types" help="Warning instead of exit with error if instrument types between runs is different" truevalue="--allow-alt-instruments" falsevalue=""/>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
46 <param name="maldi" type="boolean" label="Maldi data" truevalue="-l" falsevalue=""/>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
47
4c66453a168e Uploaded
iracooke
parents:
diff changeset
48
4c66453a168e Uploaded
iracooke
parents:
diff changeset
49 </inputs>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
50 <outputs>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
51 <data format="peptideprophet_pepxml" name="output" metadata_source="input_file" label="peptide_prophet.${input_file.display_name}.pep.xml" from_work_dir="peptide_prophet_output.pep.xml"/>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
52 </outputs>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
53
4c66453a168e Uploaded
iracooke
parents:
diff changeset
54 <help>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
55
4c66453a168e Uploaded
iracooke
parents:
diff changeset
56 **What it does**
4c66453a168e Uploaded
iracooke
parents:
diff changeset
57
4c66453a168e Uploaded
iracooke
parents:
diff changeset
58 Given raw search engine scores as inputs, this tool estimates the accuracy of peptide assignments. From a practical perspective, it estimates the probability that each peptide assignment is correct (providing probabilities as outputs), given raw scores (possibly on some arbitrary scale) as inputs.
4c66453a168e Uploaded
iracooke
parents:
diff changeset
59
4c66453a168e Uploaded
iracooke
parents:
diff changeset
60 ----
4c66453a168e Uploaded
iracooke
parents:
diff changeset
61
4c66453a168e Uploaded
iracooke
parents:
diff changeset
62 **Citation**
4c66453a168e Uploaded
iracooke
parents:
diff changeset
63
4c66453a168e Uploaded
iracooke
parents:
diff changeset
64 If you use this tool, please read and cite the paper describing the statistical model implemented by Peptide Prophet:
4c66453a168e Uploaded
iracooke
parents:
diff changeset
65
4c66453a168e Uploaded
iracooke
parents:
diff changeset
66 Keller A., et al. “Empirical Statistical Model to Estimate the Accuracy of Peptide Identifications Made by MS/MS and Database Search” *Anal. Chem.* 74, 5383-5392 (2002).
4c66453a168e Uploaded
iracooke
parents:
diff changeset
67
4c66453a168e Uploaded
iracooke
parents:
diff changeset
68
4c66453a168e Uploaded
iracooke
parents:
diff changeset
69 </help>
4c66453a168e Uploaded
iracooke
parents:
diff changeset
70
4c66453a168e Uploaded
iracooke
parents:
diff changeset
71
4c66453a168e Uploaded
iracooke
parents:
diff changeset
72 <!--PeptideProphet options [following the 'O']:
4c66453a168e Uploaded
iracooke
parents:
diff changeset
73 i [use icat information in PeptideProphet]
4c66453a168e Uploaded
iracooke
parents:
diff changeset
74 f [do not use icat information in PeptideProphet]
4c66453a168e Uploaded
iracooke
parents:
diff changeset
75 g [use N-glyc motif information in PeptideProphet]
4c66453a168e Uploaded
iracooke
parents:
diff changeset
76 H [use Phospho information in PeptideProphet]
4c66453a168e Uploaded
iracooke
parents:
diff changeset
77 m [maldi data]
4c66453a168e Uploaded
iracooke
parents:
diff changeset
78 I [use pI information in PeptideProphet]
4c66453a168e Uploaded
iracooke
parents:
diff changeset
79 R [use Hydrophobicity / RT information in PeptideProphet]
4c66453a168e Uploaded
iracooke
parents:
diff changeset
80 F [force the fitting of the mixture model, bypass automatic mixture model checks]
4c66453a168e Uploaded
iracooke
parents:
diff changeset
81 A [use accurate mass binning in PeptideProphet]
4c66453a168e Uploaded
iracooke
parents:
diff changeset
82 w [warning instead of exit with error if instrument types between runs is different]
4c66453a168e Uploaded
iracooke
parents:
diff changeset
83 x [exclude all entries with asterisked score values in PeptideProphet]
4c66453a168e Uploaded
iracooke
parents:
diff changeset
84 l [leave alone all entries with asterisked score values in PeptideProphet]
4c66453a168e Uploaded
iracooke
parents:
diff changeset
85 n [use hardcoded default initialization parameters of the distributions]
4c66453a168e Uploaded
iracooke
parents:
diff changeset
86 P [use Non-parametric model, can only be used with decoy option]
4c66453a168e Uploaded
iracooke
parents:
diff changeset
87 N [do not use the NTT model]
4c66453a168e Uploaded
iracooke
parents:
diff changeset
88 M [do not use the NMC model]
4c66453a168e Uploaded
iracooke
parents:
diff changeset
89 G [use Gamma Distribution to model the Negatives (applies only to X!Tandem data)]
4c66453a168e Uploaded
iracooke
parents:
diff changeset
90 E [only use Expect Score as the Discriminant(applies only to X!Tandem data,
4c66453a168e Uploaded
iracooke
parents:
diff changeset
91 helpful for data with homologous top hits e.g. phospho or glyco)]
4c66453a168e Uploaded
iracooke
parents:
diff changeset
92 d [report decoy hits with a computed probability based on the model learned]
4c66453a168e Uploaded
iracooke
parents:
diff changeset
93 p [run ProteinProphet afterwards]
4c66453a168e Uploaded
iracooke
parents:
diff changeset
94 t [do not create png data plot]
4c66453a168e Uploaded
iracooke
parents:
diff changeset
95 u [do not assemble protein groups in ProteinProphet analysis]
4c66453a168e Uploaded
iracooke
parents:
diff changeset
96 s [do not use Occam's Razor in ProteinProphet analysis to
4c66453a168e Uploaded
iracooke
parents:
diff changeset
97 derive the simplest protein list to explain observed peptides]
4c66453a168e Uploaded
iracooke
parents:
diff changeset
98 -->
4c66453a168e Uploaded
iracooke
parents:
diff changeset
99
4c66453a168e Uploaded
iracooke
parents:
diff changeset
100 </tool>