comparison proteinpilot_group_extractor.xml @ 8:0aa9d080713e

Update for ProteinPilot version 5.0
author Jim Johnson <jj@umn.edu>
date Thu, 05 Nov 2015 13:15:48 -0600
parents
children 8935cf27e8fd
comparison
equal deleted inserted replaced
7:ffbfff887a03 8:0aa9d080713e
1 <tool id="proteinpilot_group_extractor" name="ProteinPilot - GroupFileExtractor" version="5.0.0">
2 <description>convert group file to tabular reports, mzIdentML, and MGF</description>
<!-- Cheetah template: emits one GroupFileExtractor.exe call per selected report type, chained with ' && '.
     Each call writes a fixed relative file name that the outputs section collects via from_work_dir.
     The input path is wrapped in double quotes so a path containing spaces stays a single argument.
     $denom is the quantitation denominator code, or an empty string when quantitation is not requested. -->
3 <command>
4 <![CDATA[
5 #if $quant.use
6 #set $denom = str($quant.dtype)
7 #else
8 #set $denom = ""
9 #end if
10 #set $ptypes = str($ptype).split(',')
11 #set $cmd = []
12 #if 'PROTEIN' in $ptypes:
13 #silent $cmd.append('GroupFileExtractor.exe PROTEIN "' + str($input) + '" protein_report.txt ' + $denom)
14 #end if
15 #if 'PEPTIDE' in $ptypes:
16 #silent $cmd.append('GroupFileExtractor.exe PEPTIDE "' + str($input) + '" peptide_report.txt ' + $denom)
17 #end if
18 #if 'DISTINCT_PEPTIDE' in $ptypes:
19 #silent $cmd.append('GroupFileExtractor.exe DISTINCT_PEPTIDE "' + str($input) + '" distinct_peptide_report.txt ' + $denom)
20 #end if
21 #if 'SPECTRUM' in $ptypes:
22 #silent $cmd.append('GroupFileExtractor.exe SPECTRUM "' + str($input) + '" spectrum_report.txt ' + $denom)
23 #end if
24 #if 'FEATURES' in $ptypes:
25 #silent $cmd.append('GroupFileExtractor.exe FEATURES "' + str($input) + '" features_report.txt ' + $denom)
26 #end if
27 #if 'MZIDENTML' in $ptypes:
28 #silent $cmd.append('GroupFileExtractor.exe MZIDENTML "' + str($input) + '" mzidentml.mzid ' + $denom)
29 #end if
30 #if 'MGF' in $ptypes:
31 #silent $cmd.append('GroupFileExtractor.exe MGF "' + str($input) + '" output.mgf ' + $denom)
32 #end if
33 #if 'XML' in $ptypes:
34 #silent $cmd.append('GroupFileExtractor.exe XML "' + str($input) + '" results.xml ' + $denom)
35 #end if
36 #if 'METADATAXML' in $ptypes:
37 #silent $cmd.append('GroupFileExtractor.exe METADATAXML "' + str($input) + '" metadata.xml ' + $denom)
38 #end if
39 #if 'METADATACSV' in $ptypes:
40 #silent $cmd.append('GroupFileExtractor.exe METADATACSV "' + str($input) + '" metadata.csv ' + $denom)
41 #end if
42 #echo ' && '.join($cmd)
43 ]]>
44 </command>
<!-- Tool form: the ProteinPilot .group dataset, the report types to extract, and an optional
     quantitation denominator that the command appends as the last argument of every call.
     'ptype' sets optional="false" explicitly because multiple selects are optional by default;
     an empty selection would otherwise produce an empty command line and no outputs. -->
45 <inputs>
46 <param format="group" name="input" type="data" label="ProteinPilot Group Data" help=""/>
47 <param name="ptype" type="select" multiple="true" optional="false" label="Summary Type">
48 <option value="PROTEIN">PROTEIN</option>
49 <option value="PEPTIDE">PEPTIDE</option>
50 <option value="DISTINCT_PEPTIDE">DISTINCT_PEPTIDE</option>
51 <option value="SPECTRUM">SPECTRUM</option>
52 <option value="FEATURES">FEATURES</option>
53 <option value="MZIDENTML">MZIDENTML</option>
54 <option value="MGF">MGF</option>
55 <option value="XML">XML</option>
56 <option value="METADATAXML">METADATAXML</option>
57 <option value="METADATACSV">METADATACSV</option>
58 </param>
59 <conditional name="quant">
60 <param name="use" type="boolean" label="Include quantitation results" truevalue="true" falsevalue="false" />
61 <when value="true">
62 <param name="dtype" type="select" label="Denominator">
63 <option value="IT113">113</option>
64 <option value="IT114" selected="true">114</option>
65 <option value="IT115">115</option>
66 <option value="IT116">116</option>
67 <option value="IT117">117</option>
68 <option value="IT118">118</option>
69 <option value="IT119">119</option>
70 <option value="IT121">121</option>
71 <option value="Light">Light</option>
72 <option value="Heavy">Heavy</option>
73 <option value="Medium">Medium</option>
74 </param>
75 </when>
76 <when value="false"/>
77 </conditional>
78 </inputs>
<!-- One dataset per report type. Each is picked up from the fixed file name the command writes
     into the job working directory, and its filter tests whether that report type is in 'ptype'. -->
79 <outputs>
80 <data name="protein_report" format="tabular" from_work_dir="protein_report.txt" label="PROTEIN report for ${on_string}">
81 <filter>'PROTEIN' in ptype</filter>
82 </data>
83 <data name="peptide_report" format="tabular" from_work_dir="peptide_report.txt" label="PEPTIDE report for ${on_string}">
84 <filter>'PEPTIDE' in ptype</filter>
85 </data>
86 <data name="distinct_peptide_report" format="tabular" from_work_dir="distinct_peptide_report.txt" label="DISTINCT_PEPTIDE report for ${on_string}">
87 <filter>'DISTINCT_PEPTIDE' in ptype</filter>
88 </data>
89 <data name="spectrum_report" format="tabular" from_work_dir="spectrum_report.txt" label="SPECTRUM report for ${on_string}">
90 <filter>'SPECTRUM' in ptype</filter>
91 </data>
92 <data name="features_report" format="tabular" from_work_dir="features_report.txt" label="FEATURES report for ${on_string}">
93 <filter>'FEATURES' in ptype</filter>
94 </data>
95 <data name="mzidentml" format="mzid" from_work_dir="mzidentml.mzid" label="mzIdentML for ${on_string}">
96 <filter>'MZIDENTML' in ptype</filter>
97 </data>
98 <data name="mgf" format="mgf" from_work_dir="output.mgf" label="mgf for ${on_string}">
99 <filter>'MGF' in ptype</filter>
100 </data>
101 <data name="results_xml" format="xml" from_work_dir="results.xml" label="Results.xml for ${on_string}">
102 <filter>'XML' in ptype</filter>
103 </data>
104 <data name="metadata_xml" format="xml" from_work_dir="metadata.xml" label="Metadata.xml for ${on_string}">
105 <filter>'METADATAXML' in ptype</filter>
106 </data>
107 <data name="metadata_csv" format="csv" from_work_dir="metadata.csv" label="Metadata.csv for ${on_string}">
108 <filter>'METADATACSV' in ptype</filter>
109 </data>
110 </outputs>
111 <help>
112 <![CDATA[
113 **ProteinPilot GroupFileExtractor**
114
115 Requires ProteinPilot version 5
116
117
118 **INPUT**
119
120 A ProteinPilot .group file
121
122 **OUTPUTS**
123
124 Data can now be exported in the following formats:
125
126 (1) **Protein Summary**
127
128 A tabular report of detected proteins.
129
130 (2) **Peptide Summary**
131
132 A tabular report of detected peptides.
133
134 (3) **Distinct Peptide Summary**
135
136 The Distinct Peptide Summary export provides a summary of all peptide groups for each group that has at least one hypothesis with at least 15% confidence. The purpose is to report a list of all distinct physical peptides that have been detected. Each physical peptide can have multiple precursor charge states observed as detected, separate LCMS map features. To attempt to identify the peptide, each of these LCMS features can have MS/MS spectra triggered.
137
138 The process of identification does not always result in a clear single answer, so ambiguity in identification can occur. The purpose of the peptide group is to group all competitive hypotheses for a given physical peptide arising from the following three levels:
139
140 - multiple precursor charge states,
141 - multiple MS/MS spectra of a given charge state, and
142 - multiple answers for a given MS/MS spectrum.
143
144 The Distinct Peptide Summary export is unlike the previous Peptide Summary export, which exported information only about the peptides claimed by reported proteins. The Distinct Peptide Summary export shows all hypotheses that are within the margin of error of being the right answer, regardless of whether they are attached to reported proteins, making this export useful for peptide-centric workflows.
145
146 (4) **Spectrum Summary**
147
148 The spectrum export includes all of the top hits to each spectrum, making it spectrum-centric, rather than protein-peptide ID-centric. This gives the user a way to access all of the information, rather than just the protein-filtered information as is done with the existing Peptide Summary export.
149
150 (5) **mzIdentML**
151
152 The ProteinPilot software now exports search results in mzIdentML version 1.2 candidate format.* This is a standardized format developed by the Human Proteome Organization (HUPO) Proteomics Standards Initiative (PSI) for reporting parameters and results from mass spectrometric database search engines. Users can most easily export to mzIdentML format from the export options available in the software, but exports can also be done programmatically.
153
154 http://onlinelibrary.wiley.com/doi/10.1002/pmic.201400080/abstract Seymour, Sean et al. "A standardized framing for reporting protein identifications in mzIdentML 1.2." Proteomics. doi: 10.1002/pmic.201400080.
155
156 (6) **MGF Peak list**
157
158 Recalibrated MGF (Mascot Generic File) peak lists can now be exported programmatically.
159
160 (7) **Metadata**
161
162 This is a new export option that provides metadata based on search criteria (for example, search date, time, other search parameters). Metadata can be exported in .txt or .xml file format.
163
164 (8) **Features**
165
166 The Features export contains all of the detected protein features (for example, post-translational modifications and sequence variants).
167 Confidence Interval (CI) columns added to Proteins Detected table
168 The ProteinPilot software now reports a confidence interval for SILAC and other MS-based quantitation workflows, such as SCIEX mTRAQ. Four new column options are hidden by default but can be shown on the Protein Quant tab in the Proteins Detected table: Upper CI M:L, Lower CI M:L, Upper CI H:L, and Lower CI H:L. Upper and Lower CI column headings reflect whether the user selected a Heavy (H) or Light (L) denominator.
169 N-15 universal labeling SILAC support
170 Quantitation of universally N-15 labeled SILAC duplex samples was introduced in ProteinPilot software 4.2 Beta but required some special configuration. This feature is now available by default and no longer requires any additional steps to perform this type of quantitation analysis.
171
172 ]]>
173 </help>
174 </tool>