Mercurial > repos > galaxyp > msgfplus
comparison msgfplus.xml @ 0:ee56530a559f draft
planemo upload for repository https://github.com/galaxyproteomics/tools-galaxyp/tree/master/tools/msgfplus commit bdb474693831a3375db79755e88641ad32b3b4e6
author | galaxyp |
---|---|
date | Sun, 21 Feb 2016 11:04:06 -0500 |
parents | |
children | 797c755b9e74 |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:ee56530a559f |
---|---|
1 <tool id="msgfplus" name="MS-GF+" version="0.1"> | |
2 <description> | |
3 Identifies peptides in tandem mass spectra using the MS-GF+ search engine. | |
4 </description> | |
5 <requirements> | |
6 <requirement type="package" version="10089">msgfplus</requirement> | |
7 <environment_variable name="LC_ALL" action="set_to">C</environment_variable> | |
8 </requirements> | |
9 <stdio> | |
10 <exit_code range="1:" level="fatal" description="Job Failed" /> | |
11 <regex match="java.*Exception" level="fatal" description="Java Exception"/> | |
12 <regex match="Could not create the Java virtual machine" level="fatal" description="JVM Error"/> | |
13 </stdio> | |
14 <command> | |
15 <![CDATA[ | |
16 #set $db_name = $d.display_name.replace(".fasta", "") + ".fasta" | |
17 #set $input_name = $s.display_name | |
18 #set $output_name = $input_name.replace(".mzML", "") + ".mzid" | |
19 ln -s '$s' '${input_name}' && | |
20 ln -s '$d' '${db_name}' && | |
21 | |
22 echo \\#Mods > Mods.txt && | |
23 #set $common_mods = str($common_fixed_modifications) + "," + str($common_variable_modifications) | |
24 #for $mod in $common_mods.split(",") | |
25 echo '$mod.replace("_", ",")' >> Mods.txt && | |
26 #end for | |
27 | |
28 #for $mod in $custom_mods | |
29 echo '${mod.formula_or_mass},${mod.aa_specificity},${mod.fix_or_opt},${mod.position_specificity},${mod.mod_name}' >> Mods.txt && | |
30 #end for | |
31 | |
32 msgfjar=\$(which MSGFPlus.jar) && | |
33 ( [ -f "\$msgfjar" ] || (echo MSGFPlus.jar not found && exit 1)) && | |
34 | |
35 java -jar \$msgfjar | |
36 -s '$input_name' | |
37 -d '$db_name' | |
38 -thread \${GALAXY_SLOTS:-1} | |
39 -mod Mods.txt | |
40 -tda $tda | |
41 -t $t$precursor_ion_tol_units | |
42 -ti $advanced.isotope_low,$advanced.isotope_high | |
43 -m $advanced.m | |
44 -inst $inst | |
45 -e $e | |
46 -protocol $advanced.protocol | |
47 -ntt $ntt | |
48 -minLength $advanced.minLength | |
49 -maxLength $advanced.maxLength | |
50 -minCharge $advanced.minCharge | |
51 -maxCharge $advanced.maxCharge | |
52 -n $advanced.n | |
53 -addFeatures $advanced.addFeatures | |
54 && | |
55 mv '$output_name' output | |
56 ]]> | |
57 </command> | |
58 <inputs> | |
59 <param argument="-s" type="data" format="mzml" label="Input Raw MS File(s)"/> | |
60 <param argument="-d" type="data" format="fasta" label="Protein Database" help="Select FASTA database from history"/> | |
61 <param argument="-tda" type="boolean" truevalue="1" falsevalue="0" checked="true" label="Search with on-the-fly decoy database?" help="MSGF+ uses XXX_ as an accession prefix to indicate a decoy hit" /> | |
62 <param argument="-t" type="float" value="10" label="Precursor mass tolerance" help="Error tolerance for matching peptide mass to precursor ion mass"/> | |
63 <param name="precursor_ion_tol_units" type="select" label="Precursor mass tolerance units" help="Daltons are common for low-res instruments, ppm for high-res instruments"> | |
64 <option value="ppm" selected="true">Parts per million (ppm)</option> | |
65 <option value="Da">Daltons</option> | |
66 </param> | |
67 <param argument="-inst" label="Instrument type" type="select" help="The instrument type that generated the MS/MS spectra is used to determine the scoring model"> | |
68 <option value="0" selected="true">Low-res (LCQ/LTQ)</option> | |
69 <option value="1" >High-res (LTQ-Orbitrap)</option> | |
70 <option value="2" >Q-TOF</option> | |
71 <option value="3" >Q-Exactive</option> | |
72 </param> | |
73 <param argument="-e" type="select" label="Enzyme" help="Enzyme used to digest proteins in sample preparation; trypsin is the most commonly used enzyme"> | |
74 <option value="0">Unspecific cleavage</option> | |
75 <option value="1" selected="true">Trypsin, no P rule</option> | |
76 <option value="2">Chymotrypsin, no P rule (FYWL)</option> | |
77 <option value="3">Lys-C, no P rule</option> | |
78 <option value="4">Lys-N</option> | |
79 <option value="5">Glu-C (glutamyl endopeptidase)</option> | |
80 <option value="6">Arg-C</option> | |
81 <option value="7">Asp-N</option> | |
82 <option value="8">Alpha-lytic protease</option> | |
83 <option value="9">No enzyme</option> | |
84 </param> | |
85 <param argument="-ntt" type="select" format="text" label="Number of tolerable termini" help="Semi-specific requires more time than fully specific; non-specific requires much more."> | |
86 <option value="2" selected="true">Fully specific (both termini match cleavage rules)</option> | |
87 <option value="1">Semi-specific (at least one terminus must match cleavage rules)</option> | |
88 <option value="0">Non-specific (neither terminus is required to match cleavage rules)</option> | |
89 </param> | |
90 | |
91 <param name="common_fixed_modifications" type="select" label="Common Fixed Modifications" multiple="true" help="Occurs in known places on peptide sequence. Hold the appropriate key while clicking to select multiple items"> | |
92 <option value="C2H3N1O1_C_fix_any_Carbamidomethyl" selected="true">Carbamidomethyl C</option> | |
93 <option value="144.102063_*_fix_N-term_iTRAQ4plex">iTRAQ 4-plex N-term</option> | |
94 <option value="144.102063_K_fix_any_iTRAQ4plex">iTRAQ 4-plex K</option> | |
95 <option value="225.155833_*_fix_N-term_TMT6plex">TMT 2-plex N-term</option> | |
96 <option value="225.155833_K_fix_any_TMT6plex">TMT 2-plex K</option> | |
97 <option value="229.162932_*_fix_N-term_TMT6plex">TMT 6-or-10-plex N-term</option> | |
98 <option value="229.162932_K_fix_any_TMT6plex">TMT 6-or-10-plex K</option> | |
99 <sanitizer invalid_char=""><valid initial="string.printable"><add value="["/><add value="]"/><add value=","/><add value="-"/></valid><mapping initial="none"></mapping></sanitizer> | |
100 </param> | |
101 <param name="common_variable_modifications" type="select" label="Common Variable Modifications" multiple="true" help="Can occur anywhere on the peptide sequence; adds additional error to search score. Hold the appropriate key while clicking to select multiple items"> | |
102 <option value="C2H2O1_K_opt_any_Acetyl">Acetylation K</option> | |
103 <option value="C2H2O_*_opt_Prot-N-term_Acetyl">Acetylation Protein N-term</option> | |
104 <option value="C2H3NO_C_opt_any_Carbamidomethyl">Carbamidomethyl C</option> | |
105 <option value="C2H3NO_*_opt_N-term_Carbamidomethyl">Carbamidomethyl N-term</option> | |
106 <option value="H-1N-1O1_N_opt_any_Deamidated">Deamidation N</option> | |
107 <option value="H-1N-1O1_Q_opt_any_Deamidated">Deamidation Q</option> | |
108 <option value="CH2_K_opt_any_Methyl">Methylation K</option> | |
109 <option value="O1_M_opt_any_Oxidation" selected="true">Oxidation M</option> | |
110 <option value="HO3P_S_opt_any_Phospho">Phosphorylation S</option> | |
111 <option value="HO3P_T_opt_any_Phospho">Phosphorylation T</option> | |
112 <option value="HO3P_Y_opt_any_Phospho">Phosphorylation Y</option> | |
113 <option value="H-2O-1_E_opt_N-term_Glu->pyro-Glu">Pyro-glu from E</option> | |
114 <option value="H-3N-1_Q_opt_N-term_Gln->pyro-Glu">Pyro-glu from Q</option> | |
115 <sanitizer invalid_char=""><valid initial="string.printable"><add value="["/><add value="]"/><add value=","/><add value="-"/></valid><mapping initial="none"></mapping></sanitizer> | |
116 </param> | |
117 | |
118 <repeat name="custom_mods" title="Custom Modifications" help="Specify modifications with custom parameters"> | |
119 <param name="formula_or_mass" type="text" label="Formula or Mass"> | |
120 <sanitizer> | |
121 <valid initial="string.digits"> | |
122 <add value="C"/> | |
123 <add value="H"/> | |
124 <add value="O"/> | |
125 <add value="N"/> | |
126 <add value="S"/> | |
127 <add value="P"/> | |
128 <add value="B"/><add value="r"/> | |
129 <add value="C"/><add value="l"/> | |
130 <add value="F"/><add value="e"/> | |
131 <add value="S"/> | |
132 <add value="."/> | |
133 <add value="-"/> | |
134 </valid> | |
135 </sanitizer> | |
136 </param> | |
137 <param name="aa_specificity" type="select" multiple="true" label="Amino Acid Specificity"> | |
138 <option value="*" selected="true">Any</option> | |
139 <option value="A">A</option> | |
140 <option value="C">C</option> | |
141 <option value="D">D</option> | |
142 <option value="E">E</option> | |
143 <option value="F">F</option> | |
144 <option value="G">G</option> | |
145 <option value="H">H</option> | |
146 <option value="I">I</option> | |
147 <option value="K">K</option> | |
148 <option value="L">L</option> | |
149 <option value="M">M</option> | |
150 <option value="N">N</option> | |
151 <option value="P">P</option> | |
152 <option value="Q">Q</option> | |
153 <option value="R">R</option> | |
154 <option value="S">S</option> | |
155 <option value="T">T</option> | |
156 <option value="V">V</option> | |
157 <option value="W">W</option> | |
158 <option value="Y">Y</option> | |
159 </param> | |
160 <param name="fix_or_opt" type="select" label="Variable or Fixed?"> | |
161 <option value="opt" selected="true">Variable</option> | |
162 <option value="fix">Fixed</option> | |
163 </param> | |
164 <param name="position_specificity" type="select" label="Positional Specificity"> | |
165 <option value="any" selected="true">Any</option> | |
166 <option value="n-term">Peptide N-terminal</option> | |
167 <option value="c-term">Peptide C-terminal</option> | |
168 <option value="prot-n-term">Protein N-terminal</option> | |
169 <option value="prot-c-term">Protein C-terminal</option> | |
170 </param> | |
171 <param name="mod_name" type="text" label="Name" help="If this mod has an entry there in Unimod, this name should match its name there" /> | |
172 </repeat> | |
173 | |
174 <!-- MS-GF+ ADVANCED PARAMETERS --> | |
175 <section name="advanced" title="Advanced Options"> | |
176 <param argument="-minCharge" label="Minimum precursor charge" value="2" type="integer" help="Minimum precursor charge to consider if charges are not specified in the spectrum file"/> | |
177 <param argument="-maxCharge" label="Maximum precursor charge" value="3" type="integer" help="Maximum precursor charge to consider if charges are not specified in the spectrum file"/> | |
178 <param argument="-minLength" label="Minimum peptide length" value="6" type="integer" help="Minimum peptide length to consider"/> | |
179 <param argument="-maxLength" label="Maximum peptide length" value="40" type="integer" help="Maximum peptide length to consider"/> | |
180 <param name="num_ptms" label="Maximum modifications allowed per peptide" type="integer" value="2" /> | |
181 <param argument="-m" label="Fragmentation type" type="select" help="Fragmentation method identifier (used to determine the scoring model)"> | |
182 <option value="0" selected="True">As written in the spectrum or CID if no info</option> | |
183 <option value="1" >CID</option> | |
184 <option value="2" >ETD</option> | |
185 <option value="3" >HCD</option> | |
186 </param> | |
187 <param argument="-protocol" label="Protocol type" type="select" help="Protocols are used to enable scoring parameters for enriched and/or labeled samples"> | |
188 <option value="0" selected="True">Automatic</option> | |
189 <option value="1" >Phosphorylation</option> | |
190 <option value="2" >iTRAQ</option> | |
191 <option value="3" >iTRAQPhospho</option> | |
192 <option value="4" >TMT</option> | |
193 <option value="5" >Standard</option> | |
194 </param> | |
195 <param argument="-n" label="Maximum matches per spectrum" type="integer" value="1" help="Number of peptide matches per spectrum to report" /> | |
196 <param argument="-addFeatures" label="Calculate additional scoring features?" type="boolean" truevalue="1" falsevalue="0" help="If true, several extra derivative scores are calculated for each match" /> | |
197 <param name="isotope_low" label="Lower isotope error range" type="integer" value="0" help="Takes into account of the error introduced by chooosing a non-monoisotopic peak for fragmentation (-ti)" /> | |
198 <param name="isotope_high" label="Upper isotope error range" type="integer" value="1" /> | |
199 </section> | |
200 </inputs> | |
201 <outputs> | |
202 <data name="output" format="mzid" from_work_dir="output" /> | |
203 </outputs> | |
204 <tests> | |
205 <test> | |
206 <param name="s" value="input/201208-378803.mzML" /> | |
207 <param name="d" value="input/cow.protein.PRG2012-subset.fasta" /> | |
208 <param name="tda" value="1" /> | |
209 <param name="ntt" value="1" /> | |
210 <param name="t" value="50" /> | |
211 <param name="precursor_ion_tol_units" value="ppm" /> | |
212 <param name="common_fixed_modifications" value="" /> | |
213 <param name="common_variable_modifications" value="" /> | |
214 <output name="output" file="201208-378803-msgf-50ppm-semitryptic-no_mods.mzid" lines_diff="6" /> | |
215 </test> | |
216 <test> | |
217 <param name="s" value="input/201208-378803.mzML" /> | |
218 <param name="d" value="input/cow.protein.PRG2012-subset.fasta" /> | |
219 <param name="tda" value="1" /> | |
220 <param name="t" value="0.02" /> | |
221 <param name="precursor_ion_tol_units" value="Da" /> | |
222 <param name="isotope_low" value="-1" /> | |
223 <param name="isotope_high" value="0" /> | |
224 <param name="m" value="3" /> | |
225 <param name="inst" value="2" /> | |
226 <param name="e" value="3" /> | |
227 <param name="protocol" value="2" /> | |
228 <param name="minLength" value="10" /> | |
229 <param name="maxLength" value="20" /> | |
230 <param name="minCharge" value="2" /> | |
231 <param name="maxCharge" value="6" /> | |
232 <param name="n" value="2" /> | |
233 <param name="addFeatures" value="1" /> | |
234 | |
235 <param name="common_fixed_modifications" value="C2H3N1O1_C_fix_any_Carbamidomethyl,144.102063_*_fix_N-term_iTRAQ4plex,144.102063_K_fix_any_iTRAQ4plex" /> | |
236 <param name="common_variable_modifications" value="O1_M_opt_any_Oxidation,H-3N-1_Q_opt_N-term_Gln->pyro-Glu" /> | |
237 | |
238 <param name="custom_mods_0|formula_or_mass" value="C-2H-2O-2" /> | |
239 <param name="custom_mods_0|aa_specificity" value="G" /> | |
240 <param name="custom_mods_0|fix_or_opt" value="opt" /> | |
241 <param name="custom_mods_0|position_specificity" value="c-term" /> | |
242 <param name="custom_mods_0|mod_name" value="Gly-loss+Amide" /> | |
243 | |
244 <param name="custom_mods_1|formula_or_mass" value="C10H10N5O7P" /> | |
245 <param name="custom_mods_1|aa_specificity" value="CS" /> | |
246 <param name="custom_mods_1|fix_or_opt" value="opt" /> | |
247 <param name="custom_mods_1|position_specificity" value="any" /> | |
248 <param name="custom_mods_1|mod_name" value="cGMP" /> | |
249 | |
250 <output name="output" file="201208-378803-msgf-2mmu-tryptic-many_mods.mzid" lines_diff="6" /> | |
251 </test> | |
252 </tests> | |
253 <help> | |
254 **What it does** | |
255 | |
256 Performs protein identification via database search using MS-GF+. | |
257 | |
258 </help> | |
259 <citations> | |
260 <citation type="doi">10.1038/ncomms6277</citation> | |
261 <citation type="doi">10.1021/pr8001244</citation> | |
262 <citation type="bibtex">@misc{toolsGalaxyP, author = {Chilton, J, Gruening, B, Chambers, MC, et al.}, title = {Galaxy Proteomics Tools}, publisher = {GitHub}, journal = {GitHub repository}, | |
263 year = {2015}, url = {https://github.com/galaxyproteomics/tools-galaxyp}}</citation> <!-- TODO: fix substitution of commit ", commit = {$sha1$}" --> | |
264 </citations> | |
265 </tool> |