Repository 'xtandem'
hg clone https://toolshed.g2.bx.psu.edu/repos/iracooke/xtandem

Changeset 14:9d6e0ad4d600 (2015-03-26)
Previous changeset 13:c60d1f18fd85 (2014-07-01) Next changeset 15:0faaab4f192a (2015-10-20)
Commit message:
Docker support and update for protk 1.4
modified:
repository_dependencies.xml
tandem.xml
tandem_to_pepxml.xml
tool-data/tandem_mods.loc.sample
added:
README.rst
test-data/tandem_to_pepxml_test.tandem
test-data/testdb.fasta
test-data/tiny.mzML
removed:
README
b
diff -r c60d1f18fd85 -r 9d6e0ad4d600 README
--- a/README Tue Jul 01 11:06:33 2014 -0400
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
@@ -1,6 +0,0 @@
-Galaxy wrapper for running the X!Tandem search engine and converting results to pepXML
-
-Requirements:
-This package uses protk and the trans_proteomic_pipeline. These must be installed separately. 
-
-For instructions please see: https://github.com/iracooke/protk/#galaxy-integration
\ No newline at end of file
b
diff -r c60d1f18fd85 -r 9d6e0ad4d600 README.rst
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/README.rst Thu Mar 26 19:53:53 2015 -0400
b
@@ -0,0 +1,39 @@
+X!Tandem
+========
+
+Galaxy wrapper for running the X!Tandem search engine and converting results to pepXML
+
+Requirements
+------------
+
+This package uses protk_ and the trans_proteomic_pipeline_ which need to be present in order for the tool to work.
+
+.. _protk: https://github.com/iracooke/protk
+.. _trans_proteomic_pipeline: http://tools.proteomecenter.org/wiki/index.php?title=Software:TPP
+
+There are two ways you can satify these dependencies (choose one):
+
+1. **Manual Install:** Details on how to install protk_ and the trans_proteomic_pipeline_ manually are available here_.
+
+2. **Use Docker:** These tools are designed to run inside a docker_ container. If your galaxy supports `running tools within a docker container`__ you don't need to worry about dependencies. Simply install and things should just work.  The docker container itself is versioned and new versions of this tool will automatically download an update to the container if needed.
+
+.. _docker: https://www.docker.com/
+.. _here: https://github.com/iracooke/protk/#galaxy-integration
+.. _container: https://wiki.galaxyproject.org/Admin/Tools/Docker
+__ container_
+
+
+Further Info
+------------
+
+The source code for this tool and other protk galaxy tools is on github_.  Please visit the github page to contribute to the project or to `report an issue`__ 
+
+.. _github: https://github.com/iracooke/protk-galaxytools
+.. _issue: https://github.com/iracooke/protk-galaxytools/issues
+__ issue_
+
+
+Please visit the XTandem_ page on the GPM website for details of the search engine itself.
+
+.. _XTandem: http://www.thegpm.org/tandem/
+
b
diff -r c60d1f18fd85 -r 9d6e0ad4d600 repository_dependencies.xml
--- a/repository_dependencies.xml Tue Jul 01 11:06:33 2014 -0400
+++ b/repository_dependencies.xml Thu Mar 26 19:53:53 2015 -0400
b
@@ -1,4 +1,4 @@
 <?xml version="1.0"?>
 <repositories description="Proteomics datatypes">
-    <repository changeset_revision="f66f8ca7b7b9" name="proteomics_datatypes" owner="iracooke" toolshed="http://toolshed.g2.bx.psu.edu" />
+    <repository changeset_revision="ac51d9dbfb4d" name="proteomics_datatypes" owner="iracooke" toolshed="https://toolshed.g2.bx.psu.edu" />
  </repositories>
b
diff -r c60d1f18fd85 -r 9d6e0ad4d600 tandem.xml
--- a/tandem.xml Tue Jul 01 11:06:33 2014 -0400
+++ b/tandem.xml Thu Mar 26 19:53:53 2015 -0400
[
@@ -1,7 +1,8 @@
-<tool id="proteomics_search_tandem_1" name="X!Tandem MSMS Search" version="1.0.2">
+<tool id="proteomics_search_tandem_1" name="X!Tandem MSMS Search" version="1.1.0">
 
    <requirements>
-     <requirement type="package" version="1.3.0">protk</requirement>
+         <container type="docker">iracooke/protk-1.4.1</container>
+     <requirement type="package" version="1.4">protk</requirement>
    </requirements>
 
  <description>Run an X!Tandem Search</description>
@@ -44,7 +45,7 @@
 
  -f $fragment_ion_tol 
 
- -p $precursor_ion_tol 
+ -p $precursor_ion_tol
 
  $allow_multi_isotope_search 
 
@@ -86,9 +87,9 @@
  <when value="built_in">
  <param name="paramskey" type="select" format="text" >
  <label>Paramset</label>
-     <option value="gpm">GPM</option>
+ <option value="isb_kscore">ISB K-Score (Recommended for TPP)</option>
      <option value="isb_native">ISB Native</option>
- <option value="isb_kscore">ISB K-Score</option>
+     <option value="gpm">GPM</option>
  </param>
  </when>
  <when value="input_ref">
@@ -132,7 +133,7 @@
  <label>Missed Cleavages Allowed</label>
      <option value="0">0</option>
  <option value="1">1</option>
- <option value="2">2</option>
+ <option selected="true" value="2">2</option>
  </param>
 
  <param name="cleavage_semi" type="boolean" label="Allow semi-cleaved peptides" help="This can increase search time dramatically" truevalue="--cleavage-semi" falsevalue=""/>
@@ -143,42 +144,42 @@
 
  <param name="enzyme" type="select" format="text">
      <label>Enzyme</label>
- <option value="[R]|{P}">argc - [R]|{P}</option>
- <option value="[X]|[D]">aspn - [X]|[D]</option>
- <option value="[FLMWY]|{P}">chymotrypsin - [FLMWY]|{P}</option>
- <option value="[R]|[X]">clostripain - [R]|[X]</option>
- <option value="[M]|{P}">cnbr - [M]|{P}</option>
- <option value="[AGILV]|{P}">elastase - [AGILV]|{P}</option>
- <option value="[D]|{P}">formicacid - [D]|{P}</option>
- <option value="[DE]|{P}">gluc - [DE]|{P}</option>
- <option value="[E]|{P}">gluc_bicarb - [E]|{P}</option>
- <option value="[W]|[X]">iodosobenzoate - [W]|[X]</option>
- <option value="[K]|{P}">lysc - [K]|{P}</option>
- <option value="[K]|[X]">lysc-p - [K]|[X]</option>
- <option value="[X]|[K]">lysn - [X]|[K]</option>
- <option value="[X]|[AKRS]">lysn_promisc - [X]|[AKRS]</option>
- <option value="[X]|[X]">nonspecific - [X]|[X]</option>
- <option value="[FL]|[X]">pepsina - [FL]|[X]</option>
- <option value="[P]|[X]">protein_endopeptidase - [P]|[X]</option>
- <option value="[E]|[X]">staph_protease - [E]|[X]</option>
- <option value="[FMWY]|{P},[KR]|{P},[X]|[D]">tca - [FMWY]|{P},[KR]|{P},[X]|[D]</option>
- <option value="[KR]|{P}" selected="true">trypsin - [KR]|{P}</option>
- <option value="[FKLMRWY]|{P}">trypsin/chymotrypsin - [FKLMRWY]|{P}</option>
- <option value="[KR]|{P},[M]|{P}">trypsin/cnbr - [KR]|{P},[M]|{P}</option>
- <option value="[DEKR]|{P}">trypsin_gluc - [DEKR]|{P}</option>
+ <option value="[R]__pc__{P}">argc - [R]|{P}</option>
+ <option value="[X]__pc__[D]">aspn - [X]|[D]</option>
+ <option value="[FLMWY]__pc__{P}">chymotrypsin - [FLMWY]|{P}</option>
+ <option value="[R]__pc__[X]">clostripain - [R]|[X]</option>
+ <option value="[M]__pc__{X}">cnbr - [M]|{X}</option>
+ <option value="[AGILV]__pc__{P}">elastase - [AGILV]|{P}</option>
+ <option value="[D]__pc__{P}">formicacid - [D]|{P}</option>
+ <option value="[DE]__pc__{P}">gluc - [DE]|{P}</option>
+ <option value="[E]__pc__{P}">gluc_bicarb - [E]|{P}</option>
+ <option value="[W]__pc__[X]">iodosobenzoate - [W]|[X]</option>
+ <option value="[K]__pc__{P}">lysc - [K]|{P}</option>
+ <option value="[K]__pc__[X]">lysc-p - [K]|[X]</option>
+ <option value="[X]__pc__[K]">lysn - [X]|[K]</option>
+ <option value="[X]__pc__[AKRS]">lysn_promisc - [X]|[AKRS]</option>
+ <option value="[X]__pc__[X]">nonspecific - [X]|[X]</option>
+ <option value="[FL]__pc__[X]">pepsina - [FL]|[X]</option>
+ <option value="[P]__pc__[X]">protein_endopeptidase - [P]|[X]</option>
+ <option value="[E]__pc__[X]">staph_protease - [E]|[X]</option>
+ <option value="[FMWY]__pc__{P},[KR]__pc__{P},[X]__pc__[D]">tca - [FMWY]|{P},[KR]|{P},[X]|[D]</option>
+ <option value="[KR]__pc__{P}" selected="true">trypsin - [KR]|{P}</option>
+ <option value="[FKLMRWY]__pc__{P}">trypsin/chymotrypsin - [FKLMRWY]|{P}</option>
+ <option value="[KR]__pc__{P},[M]__pc__{P}">trypsin/cnbr - [KR]|{P},[M]|{P}</option>
+ <option value="[DEKR]__pc__{P}">trypsin_gluc - [DEKR]|{P}</option>
  </param>
 
 
- <param name="fragment_ion_tol" help="Fragment Ion Tolerance in Daltons" type="float" value="0.65" min="0" max="10000" label="Fragment ion tolerance"/>
+ <param name="fragment_ion_tol" help="Fragment Ion Tolerance in Daltons" type="float" value="0.5" min="0" max="10000" label="Fragment ion tolerance"/>
 
- <param name="precursor_ion_tol" help="Precursor Ion Tolerance (Da or ppm)" type="float" value="100" min="0" max="10000" label="Precursor ion tolerance"/>
+ <param name="precursor_ion_tol" help="Precursor Ion Tolerance (Da or ppm)" type="float" value="10" min="0" max="10000" label="Precursor ion tolerance"/>
  <param name="precursor_tolu" type="select" format="text">
      <label>Precursor Ion Tolerance Units</label>
      <option value="ppm">ppm</option>
  <option value="Da">Da</option>
  </param>
 
- <param name="allow_multi_isotope_search" type="boolean" label="Allow multi-isotope search" help="This allows peptide candidates in windows around -1 Da and -2 Da from the acquired mass to be considered. Only applicable when the minus/plus window above is set to less than 0.5 Da. Good for accurate-mass instruments for which the reported precursor mass is not corrected to the monoisotopic mass." truevalue="" falsevalue=""/>
+ <param name="allow_multi_isotope_search" type="boolean" label="Allow multi-isotope search" help="This allows peptide candidates in windows around -1 Da and -2 Da from the acquired mass to be considered. Only applicable when the minus/plus window above is set to less than 0.5 Da. Good for accurate-mass instruments for which the reported precursor mass is not corrected to the monoisotopic mass." truevalue="--multi-isotope-search" falsevalue=""/>
 
  </inputs>
 
@@ -187,7 +188,19 @@
  <data format="tandem" name="output" metadata_source="input_file" label="X!Tandem_vs_${database.dbkey if $database.has_key('dbkey') else $database.fasta_file.display_name}.${input_file.display_name}.${input_file.display_name}.tandem"/>
  </outputs>
 
-
+ <tests>
+ <!-- Just test that the tool runs and produces vaguely correct output -->
+ <test>
+     <param name="source_select" value="input_ref"/>
+     <param name="fasta_file" value="testdb.fasta" format="fasta"/>
+     <param name="input_file" value="tiny.mzML" format="mzml"/>
+     <output name="output" format="tandem">
+         <assert_contents>
+ <has_text text="tandem-style" />
+         </assert_contents>
+     </output>
+ </test>
+ </tests>
   <help>
 
 **What it does**
b
diff -r c60d1f18fd85 -r 9d6e0ad4d600 tandem_to_pepxml.xml
--- a/tandem_to_pepxml.xml Tue Jul 01 11:06:33 2014 -0400
+++ b/tandem_to_pepxml.xml Thu Mar 26 19:53:53 2015 -0400
b
@@ -1,25 +1,38 @@
-<tool id="tandem_to_pepxml_1" name="Tandem to pepXML" version="1.0.1">
+<tool id="tandem_to_pepxml_1" name="Tandem to pepXML" version="1.1.0">
  <requirements>
-     <requirement type="package" version="1.3.0">protk</requirement>
-     <requirement type="package" version="4.6.3">trans_proteomic_pipeline</requirement>
-   </requirements>
+         <container type="docker">iracooke/protk-1.4.1</container>
+     <requirement type="package" version="1.4">protk</requirement>
+     <requirement type="package" version="4.8.0">trans_proteomic_pipeline</requirement>
+    </requirements>
 
-  <description>Converts a tandem result file to pepXML</description>
+ <description>Converts a tandem result file to pepXML</description>
 
-<command>
- tandem_to_pepxml.rb $input_file -o $output 
-</command>
+ <command>
+ tandem_to_pepxml.rb $input_file -o $output 
+ </command>
+
+ <inputs>
+ <param name="input_file" type="data" format="tandem" multiple="false" label="Input File" help="X!Tandem results file"/>
+ </inputs>
 
-<inputs>
- <param name="input_file" type="data" format="tandem" multiple="false" label="Input File" help="X!Tandem results file"/>
-</inputs>
+ <outputs>
+ <data format="raw_pepxml" metadata_source="input_file" name="output" label="${input_file.display_name}.pepXML" />
+ </outputs>
+
+ <help>
+ Convert X!Tandem results to pepXML
+ </help>
 
-<outputs>
- <data format="raw_pepxml" metadata_source="input_file" name="output" label="${input_file.display_name}.pepXML" />
-</outputs>
-
-<help>
- Convert X!Tandem results to pepXML
-</help>
+ <tests>
+ <!-- Just test that the tool runs and produces vaguely correct output -->
+ <test>
+     <param name="input_file" value="tandem_to_pepxml_test.tandem" format="tandem"/>
+     <output name="output" format="raw_pepxml">
+         <assert_contents>
+ <has_text text="SQVFQLESTFDV" />
+         </assert_contents>
+     </output>
+ </test>
+ </tests>
 
 </tool>
b
diff -r c60d1f18fd85 -r 9d6e0ad4d600 test-data/tandem_to_pepxml_test.tandem
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/tandem_to_pepxml_test.tandem Thu Mar 26 19:53:53 2015 -0400
b
b'@@ -0,0 +1,1145 @@\n+<?xml version="1.0"?>\n+<?xml-stylesheet type="text/xsl" href="tandem-style.xsl"?>\n+<bioml xmlns:GAML="http://www.bioml.com/gaml/" label="models from \'/Users/icooke/Desktop/iptest/mr176-BSA100fmole_BA3_01_8167.d.mgf\'">\n+<group id="1" mh="1443.700944" z="2" rt="" expect="5.9e-02" label="tr|O16132|O16132_HYDVU NK-2 class homeobox transcription factor OS=Hydra vulgaris..." type="model" sumI="3.89" maxI="899" fI="8.99" act="0" >\n+<protein expect="-1.2" id="1.1" uid="14" label="tr|O16132|O16132_HYDVU NK-2 class homeobox transcription factor OS=Hydra vulgaris..." sumI="4.77" >\n+<note label="description">tr|O16132|O16132_HYDVU NK-2 class homeobox transcription factor OS=Hydra vulgaris GN=CnNK-2 PE=2 SV=1</note>\n+<file type="peptide" URL="/Users/icooke/Desktop/iptest/AASequences.fasta"/>\n+<peptide start="1" end="328">\n+\t\n+<domain id="1.1.1" start="257" end="269" expect="5.9e-02" mh="1379.728" delta="63.973" hyperscore="24.9" nextscore="22.2" y_score="13.5" y_ions="6" b_score="0.0" b_ions="0" pre="FQHR" post="DVCL" seq="NVPVLVQNNQVSS" missed_cleavages="0">\n+</domain>\n+</peptide>\n+</protein>\n+</group>\n+<group id="2" mh="1249.669838" z="3" rt="" expect="1.9e+00" label="sp|P28468|HOX1_HALRO Homeobox protein AHox1 OS=Halocynthia roretzi GN=AHOX1 PE=2..." type="model" sumI="3.67" maxI="388" fI="3.88" act="0" >\n+<protein expect="0.0" id="2.1" uid="19" label="sp|P28468|HOX1_HALRO Homeobox protein AHox1 OS=Halocynthia roretzi GN=AHOX1 PE=2..." sumI="5.26" >\n+<note label="description">sp|P28468|HOX1_HALRO Homeobox protein AHox1 OS=Halocynthia roretzi GN=AHOX1 PE=2 SV=1</note>\n+<file type="peptide" URL="/Users/icooke/Desktop/iptest/AASequences.fasta"/>\n+<peptide start="1" end="741">\n+\t\n+<domain id="2.1.1" start="87" end="96" expect="1.9e+00" mh="1210.479" delta="39.191" hyperscore="21.6" nextscore="20.0" y_score="8.8" y_ions="4" b_score="9.8" b_ions="5" pre="NHAQ" post="SKKD" seq="EQSSEENFCR" missed_cleavages="0">\n+</domain>\n+</peptide>\n+</protein>\n+</group>\n+<group id="3" mh="1399.715504" z="2" rt="" expect="9.9e-02" label="tr|Q90853|Q90853_CHICK Homeobox protein OS=Gallus gallus GN=GH6 PE=2 SV=1" type="model" sumI="3.56" maxI="786" fI="7.86" act="0" >\n+<protein expect="-1.0" id="3.1" uid="16" label="tr|Q90853|Q90853_CHICK Homeobox protein OS=Gallus gallus GN=GH6 PE=2 SV=1" sumI="4.91" >\n+<note label="description">tr|Q90853|Q90853_CHICK Homeobox protein OS=Gallus gallus GN=GH6 PE=2 SV=1</note>\n+<file type="peptide" URL="/Users/icooke/Desktop/iptest/AASequences.fasta"/>\n+<peptide start="1" end="368">\n+\t\n+<domain id="3.1.1" start="208" end="219" expect="9.9e-02" mh="1381.663" delta="18.052" hyperscore="23.9" nextscore="19.3" y_score="7.6" y_ions="5" b_score="9.6" b_ions="4" pre="VFSR" post="KRYL" seq="SQVFQLESTFDV" missed_cleavages="0">\n+</domain>\n+</peptide>\n+</protein>\n+</group>\n+<group id="4" mh="1452.636818" z="3" rt="" expect="2.2e+00" label="sp|P28468|HOX1_HALRO Homeobox protein AHox1 OS=Halocynthia roretzi GN=AHOX1 PE=2..." type="model" sumI="3.39" maxI="389" fI="3.89" act="0" >\n+<protein expect="0.0" id="4.1" uid="19" label="sp|P28468|HOX1_HALRO Homeobox protein AHox1 OS=Halocynthia roretzi GN=AHOX1 PE=2..." sumI="5.26" >\n+<note label="description">sp|P28468|HOX1_HALRO Homeobox protein AHox1 OS=Halocynthia roretzi GN=AHOX1 PE=2 SV=1</note>\n+<file type="peptide" URL="/Users/icooke/Desktop/iptest/AASequences.fasta"/>\n+<peptide start="1" end="741">\n+\t\n+<domain id="4.1.1" start="589" end="600" expect="2.2e+00" mh="1413.614" delta="39.022" hyperscore="20.2" nextscore="19.4" y_score="10.9" y_ions="4" b_score="9.6" b_ions="3" pre="NNFK" post="FNEL" seq="SMLPGNFENPYF" missed_cleavages="0">\n+<aa type="M" at="590" modified="15.99492" />\n+</domain>\n+</peptide>\n+</protein>\n+</group>\n+<group id="5" mh="1399.717238" z="3" rt="" expect="1.1e+00" label="sp|O93590|ZAX_XENLA Homeobox protein zampogna OS=Xenopus laevis GN=zax PE=2 SV=1" type="model" sumI="4.15" maxI="2944" fI="29.44" act="0" >\n+<protein expect="0.0" id="5.1" uid="15" lab'..b'ites">2</note>\n+\t<note type="input" label="scoring, minimum ion count">4</note>\n+\t<note type="input" label="scoring, x ions">no</note>\n+\t<note type="input" label="scoring, y ions">yes</note>\n+\t<note type="input" label="scoring, z ions">no</note>\n+\t<note type="input" label="spectrum, dynamic range">100.0</note>\n+\t<note type="input" label="spectrum, fragment mass type">monoisotopic</note>\n+\t<note type="input" label="spectrum, fragment monoisotopic mass error">0.4</note>\n+\t<note type="input" label="spectrum, fragment monoisotopic mass error units">Daltons</note>\n+\t<note type="input" label="spectrum, maximum parent charge">5</note>\n+\t<note type="input" label="spectrum, minimum fragment mz">50.0</note>\n+\t<note type="input" label="spectrum, minimum parent m+h">600.0</note>\n+\t<note type="input" label="spectrum, minimum peaks">6</note>\n+\t<note type="input" label="spectrum, parent monoisotopic mass error minus">100.0</note>\n+\t<note type="input" label="spectrum, parent monoisotopic mass error plus">100.0</note>\n+\t<note type="input" label="spectrum, parent monoisotopic mass error units">Daltons</note>\n+\t<note type="input" label="spectrum, parent monoisotopic mass isotope error">no</note>\n+\t<note type="input" label="spectrum, path">/Users/icooke/Desktop/iptest/mr176-BSA100fmole_BA3_01_8167.d.mgf</note>\n+\t<note type="input" label="spectrum, sequence batch size">1000</note>\n+\t<note type="input" label="spectrum, threads">1</note>\n+\t<note type="input" label="spectrum, total peaks">50</note>\n+\t<note type="input" label="spectrum, use conditioning">yes</note>\n+\t<note type="input" label="spectrum, use noise suppression">no</note>\n+</group>\n+<group label="unused input parameters"  type="parameters">\n+\t<note type="input" label="protein, use minimal annotations">yes</note>\n+\t<note type="input" label="refine, modification mass"></note>\n+\t<note type="input" label="refine, point mutations">no</note>\n+\t<note type="input" label="refine, potential C-terminus modifications"></note>\n+\t<note type="input" label="refine, potential N-terminus modifications"></note>\n+\t<note type="input" label="refine, potential modification mass"></note>\n+\t<note type="input" label="refine, potential modification motif"></note>\n+\t<note type="input" label="refine, tic percent">10</note>\n+\t<note type="input" label="refine, unanticipated cleavage">no</note>\n+\t<note type="input" label="refine, use potential modifications for full refinement">no</note>\n+\t<note type="input" label="scoring, pluggable scoring">no</note>\n+\t<note type="input" label="spectrum, maximum parent m+h">4000.0</note>\n+</group>\n+<group label="performance parameters" type="parameters">\n+\t<note label="list path, sequence source #1">/Users/icooke/Desktop/iptest/AASequences.fasta</note>\n+\t<note label="list path, sequence source description #1">no description</note>\n+\t<note label="modelling, duplicate peptide ids">0</note>\n+\t<note label="modelling, duplicate proteins">0</note>\n+\t<note label="modelling, total peptides used">528901</note>\n+\t<note label="modelling, total proteins used">33</note>\n+\t<note label="modelling, total spectra used">118</note>\n+\t<note label="process, start time">2014:06:22:13:57:04</note>\n+\t<note label="process, version">X! Tandem Sledgehammer (2013.09.01.1)</note>\n+\t<note label="quality values">6 7 2 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0</note>\n+\t<note label="refining, # input models">0</note>\n+\t<note label="refining, # input spectra">0</note>\n+\t<note label="refining, # partial cleavage">0</note>\n+\t<note label="refining, # point mutations">0</note>\n+\t<note label="refining, # potential C-terminii">0</note>\n+\t<note label="refining, # potential N-terminii">0</note>\n+\t<note label="refining, # unanticipated cleavage">0</note>\n+\t<note label="timing, initial modelling total (sec)">0.61</note>\n+\t<note label="timing, initial modelling/spectrum (sec)">0.0052</note>\n+\t<note label="timing, load sequence models (sec)">0.00</note>\n+\t<note label="timing, refinement/spectrum (sec)">0.0000</note>\n+</group>\n+</bioml>\n'
b
diff -r c60d1f18fd85 -r 9d6e0ad4d600 test-data/testdb.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/testdb.fasta Thu Mar 26 19:53:53 2015 -0400
b
@@ -0,0 +1,38 @@
+>sp|ALBU_BOVIN|
+MKWVTFISLLLLFSSAYSRGVFRRDTHKSEIAHRFKDLGEEHFKGLVLIA
+FSQYLQQCPFDEHVKLVNELTEFAKTCVADESHAGCEKSLHTLFGDELCK
+VASLRETYGDMADCCEKQEPERNECFLSHKDDSPDLPKLKPDPNTLCDEF
+KADEKKFWGKYLYEIARRHPYFYAPELLYYANKYNGVFQECCQAEDKGAC
+LLPKIETMREKVLASSARQRLRCASIQKFGERALKAWSVARLSQKFPKAE
+FVEVTKLVTDLTKVHKECCHGDLLECADDRADLAKYICDNQDTISSKLKE
+CCDKPLLEKSHCIAEVEKDAIPENLPPLTADFAEDKDVCKNYQEAKDAFL
+GSFLYEYSRRHPEYAVSVLLRLAKEYEATLEECCAKDDPHACYSTVFDKL
+KHLVDEPQNLIKQNCDQFEKLGEYGFQNALIVRYTRKVPQVSTPTLVEVS
+RSLGKVGTRCCTKPESERMPCTEDYLSLILNRLCVLHEKTPVSEKVTKCC
+TESLVNRRPCFSALTPDETYVPKAFDEKLFTFHADICTLPDTEKQIKKQT
+ALVELLKHKPKATEEQLKTVMENFVAFVDKCCAADDKEACFAVEGPKLVV
+STQTALA
+>sp|AMYS_HUMAN|
+MKLFWLLFTIGFCWAQYSSNTQQGRTSIVHLFEWRWVDIALECERYLAPK
+GFGGVQVSPPNENVAIHNPFRPWWERYQPVSYKLCTRSGNEDEFRNMVTR
+CNNVGVRIYVDAVINHMCGNAVSAGTSSTCGSYFNPGSRDFPAVPYSGWD
+FNDGKCKTGSGDIENYNDATQVRDCRLSGLLDLALGKDYVRSKIAEYMNH
+LIDIGVAGFRIDASKHMWPGDIKAILDKLHNLNSNWFPEGSKPFIYQEVI
+DLGGEPIKSSDYFGNGRVTEFKYGAKLGTVIRKWNGEKMSYLKNWGEGWG
+FMPSDRALVFVDNHDNQRGHGAGGASILTFWDARLYKMAVGFMLAHPYGF
+TRVMSSYRWPRYFENGKDVNDWVGPPNDNGVTKEVTINPDTTCGNDWVCE
+HRWRQIRNMVNFRNVVDGQPFTNWYDNGSNQVAFGRGNRGFIVFNNDDWT
+FSLTLQTGLPAGTYCDVISGDKINGNCTGIKIYVSDDGKAHFSISNSAED
+PFIAIHAESKL
+>sp|CAS1_BOVIN|
+MKLLILTCLVAVALARPKHPIKHQGLPQEVLNENLLRFFVAPFPEVFGKE
+KVNELSKDIGSESTEDQAMEDIKQMEAESISSSEEIVPNSVEQKHIQKED
+VPSERYLGYLEQLLRLKKYKVPQLEIVPNSAEERLHSMKEGIHAQQKEPM
+IGVNQELAYFYPELFRQFYQLDAYPSGAWYYVPLGTQYTDAPSFSDIPNP
+IGSENSEKTTMPLW
+>sp|CAS2_BOVIN|
+MKFFIFTCLLAVALAKNTMEHVSSSEESIISQETYKQEKNMAINPSKENL
+CSTFCKEVVRNANEEEYSIGSSSEESAEVATEEVKITVDDKHYQKALNEI
+NQFYQKFPQYLQYLYQGPIVLNPWDQVKRNAVPITPTLNREQLSTSEENS
+KKTVDMESTEVFTKKTKLTEEEKNRLNFLKKISQRYQKFALPQYLKTVYQ
+HQKAMKPWIQPKTKVIPYVRYL
\ No newline at end of file
b
diff -r c60d1f18fd85 -r 9d6e0ad4d600 test-data/tiny.mzML
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/tiny.mzML Thu Mar 26 19:53:53 2015 -0400
b
b'@@ -0,0 +1,317 @@\n+<?xml version="1.0" encoding="ISO-8859-1"?>\n+<indexedmzML xmlns="http://psi.hupo.org/ms/mzml" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://psi.hupo.org/ms/mzml http://psidev.info/files/ms/mzML/xsd/mzML1.1.1_idx.xsd">\n+  <mzML xmlns="http://psi.hupo.org/ms/mzml" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://psi.hupo.org/ms/mzml http://psidev.info/files/ms/mzML/xsd/mzML1.1.0.xsd" id="tiny" version="1.1.0">\n+    <cvList count="2">\n+      <cv id="MS" fullName="Proteomics Standards Initiative Mass Spectrometry Ontology" version="3.7.3" URI="http://psidev.cvs.sourceforge.net/*checkout*/psidev/psi/psi-ms/mzML/controlledVocabulary/psi-ms.obo"/>\n+      <cv id="UO" fullName="Unit Ontology" version="18:03:2011" URI="http://obo.cvs.sourceforge.net/*checkout*/obo/obo/ontology/phenotype/unit.obo"/>\n+    </cvList>\n+    <fileDescription>\n+      <fileContent>\n+        <cvParam cvRef="MS" accession="MS:1000579" name="MS1 spectrum" value=""/>\n+        <cvParam cvRef="MS" accession="MS:1000580" name="MSn spectrum" value=""/>\n+        <cvParam cvRef="MS" accession="MS:1000127" name="centroid spectrum" value=""/>\n+      </fileContent>\n+      <sourceFileList count="2">\n+        <sourceFile id="sourceFile" name="ANALYSIS.BAF" location="Q:/Data/MALDI/1110/MT573/Tilo%20Knobs%20S2_BAF.d">\n+          <cvParam cvRef="MS" accession="MS:1000772" name="Bruker BAF nativeID format" value=""/>\n+          <cvParam cvRef="MS" accession="MS:1000815" name="Bruker BAF file" value=""/>\n+          <cvParam cvRef="MS" accession="MS:1000569" name="SHA-1" value="2107bc8ebc6160293e3c95b1848d4afa96435c39"/>\n+        </sourceFile>\n+        <sourceFile id="tiny.mzML" name="tiny.mzML" location="file://.">\n+          <cvParam cvRef="MS" accession="MS:1000569" name="SHA-1" value="c52beeb6ca5b6865b55e67b919317a96a064854b"/>\n+        </sourceFile>\n+      </sourceFileList>\n+      <contact>\n+        <cvParam cvRef="MS" accession="MS:1000586" name="contact name" value=" pfaou"/>\n+        <cvParam cvRef="MS" accession="MS:1000590" name="contact organization" value=""/>\n+      </contact>\n+    </fileDescription>\n+    <sampleList count="1">\n+      <sample id="sample" name="">\n+      </sample>\n+    </sampleList>\n+    <softwareList count="3">\n+      <software id="exportSoftware" version="3.0.1">\n+        <cvParam cvRef="MS" accession="MS:1000717" name="CompassXport" value=""/>\n+      </software>\n+      <software id="instrumentSoftware" version="3.3.85.0">\n+        <cvParam cvRef="MS" accession="MS:1000692" name="Bruker software" value=""/>\n+        <userParam name="AcquisitionProgram" value="flexControl"/>\n+      </software>\n+      <software id="pwiz_2.2.0_x0020__x0028_TPP_x0020_v4.6_x0020_OCCUPY_x0020_rev_x0020_1_x002c__x0020_Build_x0020_201210300824_x0020__x0028_linux_x0029__x0029_" version="2.2.0 (TPP v4.6 OCCUPY rev 1, Build 201210300824 (linux))">\n+        <cvParam cvRef="MS" accession="MS:1000615" name="ProteoWizard" value=""/>\n+      </software>\n+    </softwareList>\n+    <instrumentConfigurationList count="1">\n+      <instrumentConfiguration id="instrument">\n+        <cvParam cvRef="MS" accession="MS:1000705" name="ultraflex III TOF/TOF" value=""/>\n+        <componentList count="3">\n+          <source order="1">\n+            <cvParam cvRef="MS" accession="MS:1000075" name="matrix-assisted laser desorption ionization" value=""/>\n+          </source>\n+          <analyzer order="2">\n+            <cvParam cvRef="MS" accession="MS:1000084" name="time-of-flight" value=""/>\n+          </analyzer>\n+          <detector order="3">\n+            <cvParam cvRef="MS" accession="MS:1000026" name="detector type" value=""/>\n+          </detector>\n+        </componentList>\n+        <softwareRef ref="instrumentSoftware"/>\n+      </instrumentConfiguration>\n+    </instrumentConfigurationList>\n+    <dataProcessingList count="2">\n+      <dataProcessing id="exportation">\n+        <processingMethod order="1" software'..b'85" name="total ion current" value="31088.32173543"/>\n+          <cvParam cvRef="MS" accession="MS:1000504" name="base peak m/z" value="1488.98220680" unitCvRef="MS" unitAccession="MS:1000040" unitName="m/z"/>\n+          <cvParam cvRef="MS" accession="MS:1000505" name="base peak intensity" value="9322.68373807" unitCvRef="MS" unitAccession="MS:1000131" unitName="number of counts"/>\n+          <cvParam cvRef="MS" accession="MS:1000511" name="ms level" value="2"/>\n+          <cvParam cvRef="MS" accession="MS:1000527" name="highest observed m/z" value="1491.24548135" unitCvRef="MS" unitAccession="MS:1000040" unitName="m/z"/>\n+          <cvParam cvRef="MS" accession="MS:1000528" name="lowest observed m/z" value="59.96272840" unitCvRef="MS" unitAccession="MS:1000040" unitName="m/z"/>\n+          <scanList count="1">\n+            <cvParam cvRef="MS" accession="MS:1000795" name="no combination" value=""/>\n+            <scan>\n+              <cvParam cvRef="MS" accession="MS:1000016" name="scan start time" value="87.8333" unitCvRef="UO" unitAccession="UO:0000031" unitName="minute"/>\n+            </scan>\n+          </scanList>\n+          <precursorList count="1">\n+            <precursor>\n+              <selectedIonList count="1">\n+                <selectedIon>\n+                  <cvParam cvRef="MS" accession="MS:1000744" name="selected ion m/z" value="1489.86" unitCvRef="MS" unitAccession="MS:1000040" unitName="m/z"/>\n+                </selectedIon>\n+              </selectedIonList>\n+              <activation>\n+                <cvParam cvRef="MS" accession="MS:1000044" name="dissociation method" value=""/>\n+              </activation>\n+            </precursor>\n+          </precursorList>\n+          <binaryDataArrayList count="2">\n+            <binaryDataArray encodedLength="512">\n+              <cvParam cvRef="MS" accession="MS:1000523" name="64-bit float" value=""/>\n+              <cvParam cvRef="MS" accession="MS:1000576" name="no compression" value=""/>\n+              <cvParam cvRef="MS" accession="MS:1000514" name="m/z array" value="" unitCvRef="MS" unitAccession="MS:1000040" unitName="m/z"/>\n+              <binary>AAAAoDr7TUAAAABA4U5TQAAAAKDOjFRAAAAAYBR9VUAAAACATqJYQAAAAICzeFlAAAAAoEN6W0AAAABgNflbQAAAAKDet1xAAAAAYM0WX0AAAABg/RtgQAAAAGDGVGBAAAAAQDQ5YUAAAACgC1piQAAAAICxOGNAAAAAAP7YY0AAAABAxxhlQAAAAKB6d2VAAAAAgDnYZUAAAACA/TdmQAAAACCTlmhAAAAAYF6UakAAAADglTRsQAAAAIDVk2xAAAAAQKAJcEAAAABAE6pxQAAAAKD3x3FAAAAAQLb4cUAAAABg4dV0QAAAAEDh03lAAAAAgBoBgEAAAACgj96DQAAAACB8o5VAAAAAwJp/lkAAAABg9o2WQAAAAGBQl5ZAAAAAgJ2glkAAAAAgIr+WQAAAAIDZ5JZAAAAAwL/wlkAAAACgFvqWQAAAAIDlBJdAAAAAINQQl0AAAACgzB6XQAAAAAAFLJdAAAAAYLg1l0AAAADA7UOXQAAAAGD7TJdA</binary>\n+            </binaryDataArray>\n+            <binaryDataArray encodedLength="256">\n+              <cvParam cvRef="MS" accession="MS:1000521" name="32-bit float" value=""/>\n+              <cvParam cvRef="MS" accession="MS:1000576" name="no compression" value=""/>\n+              <cvParam cvRef="MS" accession="MS:1000515" name="intensity array" value="" unitCvRef="MS" unitAccession="MS:1000131" unitName="number of counts"/>\n+              <binary>DykLQ5jS4kJ0ggxDC8pKQ/sT+0JBi/xC6V0RQ+8nhUOldBFD3dHoQm+cI0N9sgxDumcAQ3Zc8UKzwLNDiQUTQ8XNIUONE1lD3Q+gQ9aVJkPvReFD/Q4uQ2eyZkMvRitDeOMTQ8E0cUNzSotDWOkdQ83tfkP1u6xDDTHOQ575v0P4BVlDlp+dQ1Fkq0PCvJVDx2SfQ3ams0PnGgpENKcMRDawDkTCaiJEuCkyRLUbA0WRVBtFWFIdRbyqEUbw0T9F</binary>\n+            </binaryDataArray>\n+          </binaryDataArrayList>\n+        </spectrum>\n+      </spectrumList>\n+    </run>\n+  </mzML>\n+  <indexList count="2">\n+    <index name="spectrum">\n+      <offset idRef="scan=1">4983</offset>\n+      <offset idRef="scan=2">7468</offset>\n+      <offset idRef="scan=3">9985</offset>\n+      <offset idRef="scan=4">12475</offset>\n+      <offset idRef="scan=5">17113</offset>\n+      <offset idRef="scan=6">21331</offset>\n+    </index>\n+  </indexList>\n+  <indexListOffset>25171</indexListOffset>\n+  <fileChecksum>0a78dcf8705de44cf7673d1a237899b2eec9bafe</fileChecksum>\n+</indexedmzML>\n'
b
diff -r c60d1f18fd85 -r 9d6e0ad4d600 tool-data/tandem_mods.loc.sample
--- a/tool-data/tandem_mods.loc.sample Tue Jul 01 11:06:33 2014 -0400
+++ b/tool-data/tandem_mods.loc.sample Thu Mar 26 19:53:53 2015 -0400
[
@@ -3,4 +3,5 @@
 #
 Carbamidomethyl C carbamidomethyl_c_ 57.021464@C carbamidomethyl_c_
 Glycocapture-N glycocapture_n_ 0.998@N!{P}[ST] glycocapture_n_
-Oxidation M oxidation_m_ 15.994915@M oxidation_m_
\ No newline at end of file
+Oxidation M oxidation_m_ 15.994915@M oxidation_m_
+Biotin K biotin_k_ 226.077598@K biotin_k_
\ No newline at end of file