Repository 'pepquery2'
hg clone https://toolshed.g2.bx.psu.edu/repos/galaxyp/pepquery2

Changeset 0:a07976bbc4d9 (2022-11-06)
Next changeset 1:b5489f81c2fa (2023-10-18)
Commit message:
planemo upload for repository https://github.com/galaxyproteomics/tools-galaxyp/tree/master/tools/pepquery2 commit 00e1b1770d0b1f9fe31384b37b55f7ae9d97b597
added:
macros.xml
pepquery2.xml
test-data/AgilentMassHunterTest.mzXML
test-data/Uniprot.fasta
test-data/iTRAQ_f4.mgf
test-data/immunopeptidomics.mgf
test-data/novel_peptides
test-data/novel_proteins.fa
test-data/pep.txt
test-data/small-index-filter.mzML
b
diff -r 000000000000 -r a07976bbc4d9 macros.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/macros.xml Sun Nov 06 16:25:25 2022 +0000
[
b'@@ -0,0 +1,1302 @@\n+ <macros>\n+    <token name="@TOOL_VERSION@">2.0.2</token>\n+    <token name="@VERSION_SUFFIX@">0</token>\n+    <xml name="citations">\n+        <citations>\n+            <citation type="doi">10.1101/gr.235028.118</citation>\n+            <citation type="doi">10.1038/s41467-020-15456-w</citation>\n+        </citations>\n+    </xml>\n+    <token name="@PEPQUERY_DOCUMANTATION_URL@">http://pepquery.org/document.html</token>\n+\n+    <token name="@CMD_IMPORTS@">\n+#import re\n+#import os.path\n+#def identifier_or_name($input1)\n+    #if hasattr($input1, \'element_identifier\')\n+        #return $input1.element_identifier\n+    #else\n+        #return $input1.name\n+    #end if\n+#end def\n+#def clean($name1)\n+    #set $name_clean = $re.sub(\'[^\\w\\-_]\', \'_\', $re.sub(\'(?i)[.](fa|fas|fasta|imzml|mzml|mzxml|mgf|raw)$\',\'\', $re.sub(\'.*/\',\'\', $name1.rstrip(\'.gz\'))))\n+    #return $name_clean\n+#end def\n+#def ln_name($ds)\n+    #set $ext = \'\'\n+    #if $ds.is_of_type(\'mzml\') or $ds.is_of_type(\'imzml\')\n+        #set $ext = ".mzML"\n+    #else if $ds.is_of_type(\'mzxml\')\n+        #set $ext = ".mzXML"\n+    #else if $ds.is_of_type(\'mgf\')\n+        #set $ext = ".mgf"\n+    #else if $ds.is_of_type(\'thermo.raw\')\n+        #set $ext = ".raw"\n+    #else if $ds.is_of_type(\'fasta\')\n+        #set $ext = ".fasta"\n+    #end if\n+    #set $name = "%s%s" % ($clean($identifier_or_name($ds)),$ext)\n+    #return $name\n+#end def\n+    </token>\n+\n+    <token name="@INDEX_SPECTRUM_FILES@"><![CDATA[\n+#def index_spectrum_files($idx_dir,$spectrum_files)\n+#set global $input_dir = \'input_dir\'\n+#set global $index_dir = \'index_dir\'\n+mkdir -p $input_dir &&\n+#if $idx_dir\n+mkdir -p $idx_dir &&\n+ln -s $idx_dir $index_dir &&\n+#else\n+mkdir -p $index_dir &&\n+#end if\n+#if isinstance($spectrum_files, list)\n+   #set $sfiles = $spectrum_files\n+#else\n+  #set $sfiles = [$spectrum_files]\n+#end if\n+#for $sf in $sfiles\n+  #set $i_name = $ln_name($sf)\n+  #set $p_name = $os.path.join($input_dir, $i_name)\n+  ln -s \'$sf\' \'$p_name\' &&\n+#end for\n+pepquery index -i input_dir -o index_dir\n+#end def\n+    ]]></token>\n+\n+    <xml name="pepquerydb_options">\n+                        <option value="all">all</option>\n+                        <option value="w">w:global proteome</option>\n+                        <option value="p">p:phosphorylation</option>\n+                        <option value="a">a:acetylation</option>\n+                        <option value="u">u:ubiquitination</option>\n+                        <option value="g">g:glycosylation</option>\n+                        <option value="Academia_Sinica_LUAD100_Phosphoproteome_PDC000220">Academia_Sinica_LUAD100_Phosphoproteome_PDC000220</option>\n+                        <option value="Academia_Sinica_LUAD100_Proteome_PDC000219">Academia_Sinica_LUAD100_Proteome_PDC000219</option>\n+                        <option value="CCLE_proteome_MSV000085836">CCLE_proteome_MSV000085836</option>\n+                        <option value="CPTAC">CPTAC</option>\n+                        <option value="CPTAC_CCRCC_Discovery_Study_Phosphoproteme_PDC000128">CPTAC_CCRCC_Discovery_Study_Phosphoproteme_PDC000128</option>\n+                        <option value="CPTAC_CCRCC_Discovery_Study_Proteome_PDC000127">CPTAC_CCRCC_Discovery_Study_Proteome_PDC000127</option>\n+                        <option value="CPTAC_GBM_Discovery_Study_Acetylome_PDC000245">CPTAC_GBM_Discovery_Study_Acetylome_PDC000245</option>\n+                        <option value="CPTAC_GBM_Discovery_Study_Phosphoproteome_PDC000205">CPTAC_GBM_Discovery_Study_Phosphoproteome_PDC000205</option>\n+                        <option value="CPTAC_GBM_Discovery_Study_Proteome_PDC000204">CPTAC_GBM_Discovery_Study_Proteome_PDC000204</option>\n+                        <option value="CPTAC_HNSCC_Discovery_Study_Phosphoproteome_PDC000222">CPTAC_HNSCC_Discovery_Study_Phosphoproteome_PDC000222</option>\n+                        <option value="CPTAC_HNSCC_Discovery_Study_Proteome_PDC000221">CPTAC_HNSCC_Discovery_Study_Proteome_PDC000221</optio'..b'735]</option>\n+        <option value="1122">1122: Trimethyl of K [42.04695]</option>\n+        <option value="1123">1123: Trimethyl of protein A [42.04695]</option>\n+        <option value="1124">1124: Trimethyl of R [42.04695]</option>\n+        <option value="1125">1125: Trimethyl:13C(3)2H(9) of K [54.113505]</option>\n+        <option value="1126">1126: Trimethyl:13C(3)2H(9) of R [54.113505]</option>\n+        <option value="1127">1127: Trimethyl:2H(9) of K [51.103441]</option>\n+        <option value="1128">1128: Trimethyl:2H(9) of R [51.103441]</option>\n+        <option value="1129">1129: Trioxidation of W [47.984744]</option>\n+        <option value="1130">1130: Trioxidation of Y [47.984744]</option>\n+        <option value="1131">1131: Tris of N [104.071154]</option>\n+        <option value="1132">1132: Triton of C-term [188.156501]</option>\n+        <option value="1133">1133: Triton of N-term [188.156501]</option>\n+        <option value="1134">1134: Trp->Hydroxykynurenin of W [19.989829]</option>\n+        <option value="1135">1135: Trp->Kynurenin of W [3.994915]</option>\n+        <option value="1136">1136: Trp->Oxolactone of W [13.979265]</option>\n+        <option value="1137">1137: Tween20 of N-term [165.164326]</option>\n+        <option value="1138">1138: Tyr->Dha of Y [-94.041865]</option>\n+        <option value="1139">1139: Ub-amide of C [196.108602]</option>\n+        <option value="1140">1140: Ub-Br2 of C [100.063663]</option>\n+        <option value="1141">1141: Ub-VME of C [173.092617]</option>\n+        <option value="1142">1142: UgiJoullieProGly of D [154.074228]</option>\n+        <option value="1143">1143: UgiJoullieProGly of E [154.074228]</option>\n+        <option value="1144">1144: Xlink:BMOE of C [220.048407]</option>\n+        <option value="1145">1145: Xlink:DFDNB of K [203.998263]</option>\n+        <option value="1146">1146: Xlink:DFDNB of N [203.998263]</option>\n+        <option value="1147">1147: Xlink:DFDNB of Q [203.998263]</option>\n+        <option value="1148">1148: Xlink:DFDNB of R [203.998263]</option>\n+        <option value="1149">1149: Xlink:DMP of K [122.084398]</option>\n+        <option value="1150">1150: Xlink:DMP of protein N-term [122.084398]</option>\n+        <option value="1151">1151: Xlink:DMP-de of K [140.094963]</option>\n+        <option value="1152">1152: Xlink:DMP-de of protein N-term [140.094963]</option>\n+        <option value="1153">1153: Xlink:DMP-s of K [154.110613]</option>\n+        <option value="1154">1154: Xlink:DMP-s of protein N-term [154.110613]</option>\n+        <option value="1155">1155: Xlink:DSS of K [156.078644]</option>\n+        <option value="1156">1156: Xlink:DSS of protein N-term [156.078644]</option>\n+        <option value="1157">1157: Xlink:DSS-NH2 of K [155.094629]</option>\n+        <option value="1158">1158: Xlink:DSS-NH2 of protein N-term [155.094629]</option>\n+        <option value="1159">1159: Xlink:DST of K [132.005873]</option>\n+        <option value="1160">1160: Xlink:DST of protein N-term [132.005873]</option>\n+        <option value="1161">1161: Xlink:DTBPc of K [87.01427]</option>\n+        <option value="1162">1162: Xlink:DTBPc of N [87.01427]</option>\n+        <option value="1163">1163: Xlink:DTBPc of protein N-term [87.01427]</option>\n+        <option value="1164">1164: Xlink:DTBPc of Q [87.01427]</option>\n+        <option value="1165">1165: Xlink:DTBPc of R [87.01427]</option>\n+        <option value="1166">1166: Xlink:DTSSP of K [191.991486]</option>\n+        <option value="1167">1167: Xlink:DTSSP of protein N-term [191.991486]</option>\n+        <option value="1168">1168: Xlink:EGS115 of K [115.026943]</option>\n+        <option value="1169">1169: Xlink:EGS115 of protein N-term [115.026943]</option>\n+        <option value="1170">1170: Xlink:EGS244 of K [244.058303]</option>\n+        <option value="1171">1171: Xlink:EGS244 of protein N-term [244.058303]</option>\n+        <option value="1172">1172: Xlink:SMCC of C [237.100108]</option>\n+    </xml>\n+</macros>\n'
b
diff -r 000000000000 -r a07976bbc4d9 pepquery2.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/pepquery2.xml Sun Nov 06 16:25:25 2022 +0000
[
b'@@ -0,0 +1,790 @@\n+<tool id="pepquery2" name="PepQuery2" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@">\n+    <description>Peptide-centric search engine for novel peptide identification and validation.</description>\n+    <macros>\n+        <import>macros.xml</import>\n+    </macros>\n+    <requirements> \n+        <requirement type="package" version="@TOOL_VERSION@">pepquery</requirement>\n+    </requirements>\n+    <stdio>\n+        <exit_code range="1:" level="fatal" description="Failed" />\n+        <regex match="Exception"\n+               source="stderr"\n+               level="fatal"\n+               description="java Exception" />\n+    </stdio>\n+    <command><![CDATA[\n+@CMD_IMPORTS@\n+#if $req_inputs.db_type.db_type_selector == \'history\'\n+  #set $db_file = $re.sub(\'\\s\',\'_\',$re.sub(\'[.][^.]*$\',\'\',$req_inputs.db_type.db_file.display_name.split(\'/\')[-1])) + ".fa"\n+  ln -s \'$req_inputs.db_type.db_file\' \'$db_file\' &&\n+#end if\n+#if $req_inputs.ms_dataset.ms_dataset_type == \'history\'\n+  @INDEX_SPECTRUM_FILES@\n+  $index_spectrum_files($ms_index.files_path, $req_inputs.ms_dataset.spectrum_files) &&\n+#elif $req_inputs.ms_dataset.ms_dataset_type == \'indexed\'\n+  #if $os.path.exists($os.path.join($req_inputs.ms_dataset.index.extra_files_path, \'summary.txt\'))\n+    #set $index_dir = \'index_dir\'\n+    ln -s \'$req_inputs.ms_dataset.index.extra_files_path\' index_dir &&\n+  #else\n+    #raise ValueError\n+  #end if\n+#end if\n+## PepQuery command\n+pepquery \n+  -Xmx\\$[ \\${GALAXY_MEMORY_MB:-8192} / 1024 ]g\n+#if $validation.task_type == "known"\n+  -s 2 $validation.decoy\n+#else\n+  -s 1\n+#end if\n+#if $req_inputs.ms_dataset.ms_dataset_type in [\'history\', \'indexed\']\n+  -ms \'$index_dir\'\n+#elif $req_inputs.ms_dataset.ms_dataset_type in [\'PepQueryDB\', \'public\']\n+  -b \'$req_inputs.ms_dataset.dataset\'             \n+#end if\n+\n+#if $req_inputs.db_type.db_type_selector == \'history\'\n+  -db \'$db_file\'\n+#else\n+  -db \'$req_inputs.db_type.db_id\' \n+#end if\n+#if $req_inputs.input_type.input_type_selector == \'peptide\'\n+  -t $req_inputs.input_type.input_type_selector\n+  -i \'$req_inputs.input_type.multiple.input\'\n+#else\n+  -t $req_inputs.input_type.input_type_selector\n+  #if $req_inputs.input_type.input_type_selector == \'protein\'\n+    #if $req_inputs.input_type.multiple.protein_input_selector == \'identifier\'\n+      #set $prot_id = str($req_inputs.input_type.multiple.input).replace(\'|\',\'\\|\')\n+      -i \'"$prot_id"\'\n+    #else\n+      -i \'$req_inputs.input_type.multiple.input\'\n+    #end if\n+  #else\n+    -i \'$req_inputs.input_type.input\'\n+    #if $req_inputs.input_type.input_type_selector == \'DNA\'\n+      #if $req_inputs.input_type.frame == \'None\'\n+        -frame \'0\'\n+      #else\n+        -frame \'$req_inputs.input_type.frame\'\n+      #end if\n+    #else\n+            -anno \'$req_inputs.input_type.anno\'\n+    #end if\n+  #end if\n+#end if\n+#if $req_inputs.indexType\n+  -indexType $req_inputs.indexType\n+#end if\n+\n+#if $modifications.fixed_mod\n+  -fixMod \'$modifications.fixed_mod\'\n+#end if\n+#if $modifications.var_mod\n+  -varMod \'$modifications.var_mod\'\n+#end if\n+#if $digestion.enzyme\n+  -e \'$digestion.enzyme\'\n+#end if\n+#if $digestion.max_missed_cleavages\n+  -c \'$digestion.max_missed_cleavages\'\n+#end if\n+\n+#if $modifications.max_mods\n+  -maxVar \'$modifications.max_mods\'\n+#end if\n+  $modifications.unmodified\n+  $modifications.aa\n+#if $ms_params.tolerance_params.precursor_tolerance\n+  -tol \'$ms_params.tolerance_params.precursor_tolerance\'\n+#end if\n+\n+#if $ms_params.tolerance_params.precursor_unit\n+  -tolu \'$ms_params.tolerance_params.precursor_unit\'\n+#end if\n+#if $ms_params.tolerance_params.tolerance\n+  -itol \'$ms_params.tolerance_params.tolerance\'\n+#end if\n+#if $ms_params.search.frag_method\n+  -fragmentMethod \'$ms_params.search.frag_method\'\n+#end if\n+#if $ms_params.search.scoring_method\n+  -m \'$ms_params.search.scoring_method\'\n+#end if\n+  $ms_params.search.extra_score_validation\n+#if $ms_params.search.max_charge\n+  -maxCharge \'$ms_params.search.max_charge\'\n+#end if\n+#if $ms_params.search.min_char'..b' identification, one of the following:\n+\n+      - Mass Spectrometry history datasets in MGF, mzML, or mzXML format \n+      - An Indexed MS/MS dataset  (from previous PepQuery2 run or from **PepQuery2 index** tool.)\n+      - PepQueryDB dataset IDs \n+        \n+        .. \n+\n+        Multiple datasets from PepQueryDB must be separated by comma. A pattern to match datasets in PepQueryDB is also supported, for example, use \'CPTAC\' to search all datasets contain \'CPTAC\'. In addition, dataset selection from PepQueryDB based on data type (w:global proteome, p:phosphorylation, a:acetylation, u:ubiquitination, g:glycosylation) is also supported. For example, use \'p\' to search all phosphoproteomics datasets in PepQueryDB.  The **PepQuery2 Show Sets** tool will list available PepQueryDB datasets.\n+\n+\n+      - Dataset IDs from public proteomics data repositories: PRIDE, MassIVE, jPOSTrepo and iProX\n+\n+        ..\n+\n+        Dataset ID from public proteomics data repositories, one dataset is supported for each analysis. For example, use \'PXD000529\' to use all MS/MS data from dataset PXD000529 or use \'PXD000529:LM3\' to use data files containing LM3 from dataset PXD000529\n+\n+    - A reference protein fasta database, novel peptides matching a reference sequence will be excluded.  \n+\n+      - A protein fasta file\n+      - The ID for a public reference protein database from RefSeq, GENCODE, Ensembl or UniProt.\n+\n+\n+**Options**\n+\n+    - MS/MS searching parameter set name \n+\n+      .. \n+\n+      Setting a *parameter set name* will change defaults for various options,  These may be overridden by manually setting the option.\n+      The **PepQuery2 Show Sets** tool *PepQuery Predefined Parameter Sets* will list those available along with the option values that will be set.\n+      The **PepQuery2 Show Sets** tool *PepQuery Datasets* column *parameter_set* column for each PepQueryDB dataset.\n+\n+\n+    - Override default options\n+\n+      .. \n+\n+      Values for modifications are provided in a select list.  \n+      The **PepQuery2 Show Sets** tool *PepQuery Modifications* lists all available modifications.\n+\n+**Outputs**\n+    - Log.txt: \n+\n+      - Logging output from PepQuery2\n+      - When searching for *novel* peptides ignored peptide have a log message similar to: \n+\n+        - Ignore peptide (reason: exist in reference database): *PEPTIDE*\n+\n+      - When searching for *known* proteins, ignored protein have a log message similar to:\n+\n+        - Target protein is not present in database *DATABASE_NAME*: *PROTEIN_NAME*, ignored!\n+\n+    - Parameters: \n+      \n+      - parameters used in the search\n+\n+     - PSM - tabular with columns: \n+      \n+      - peptide modification n spectrum_title charge exp_mass ppm pep_mass mz score n_db total_db n_random total_random pvalue\n+\n+    - PSM Rank - tabular with columns: \n+      \n+      - peptide mo/dification n spectrum_title charge exp_mass ppm pep_mass mz score n_db total_db n_random total_random pvalue rank n_ptm\n+\n+    - An MGF with the best matching spectrums\n+\n+    - Detail - tabular with columns: \n+      \n+      - spectrum_title peptide modification pep_mass score\n+\n+    - PSM annotation - tabular with columns: \n+      \n+      - peptide Query calc_mr observed_mz charge pepSeq m_label m_mz m_intensity mz intensity\n+\n+     - PTM - tabular with columns: \n+      \n+      - spectrum_title peptide charge exp_mass pep_mass tol_ppm tol_da isotope_error modification score\n+\n+     - PTM Detail - tabular with columns: \n+      \n+      - peptide modification n spectrum_title charge exp_mass tol_ppm tol_da isotope_error pep_mass mz score n_db total_db n_random total_random pvalue rank ptm_spectrum_title ptm_peptide ptm_charge ptm_exp_mass ptm_pep_mass ptm_tol_ppm ptm_tol_da ptm_isotope_error ptm_modification ptm_score\n+\n+    - An Indexed MS/MS dataset *when MS/MS data is MGF, mzML, or mzXML history datasets*\n+\n+\n+.. _PepQuery: http://pepquery.org/document.html\n+\n+    ]]></help>\n+    <expand macro="citations" />\n+</tool>\n'
b
diff -r 000000000000 -r a07976bbc4d9 test-data/AgilentMassHunterTest.mzXML
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/AgilentMassHunterTest.mzXML Sun Nov 06 16:25:25 2022 +0000
b
b'@@ -0,0 +1,4263 @@\n+<?xml version="1.0" encoding="ISO-8859-1"?>\n+<mzXML xmlns="http://sashimi.sourceforge.net/schema_revision/mzXML_3.2"\n+       xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"\n+       xsi:schemaLocation="http://sashimi.sourceforge.net/schema_revision/mzXML_3.2 http://sashimi.sourceforge.net/schema_revision/mzXML_3.2/mzXML_idx_3.2.xsd">\n+  <msRun scanCount="212" startTime="PT0.668S" endTime="PT209.708S">\n+    <msInstrument msInstrumentID="1">\n+      <msManufacturer category="msManufacturer" value="instrument model"/>\n+      <msModel category="msModel" value="Agilent instrument model"/>\n+      <msIonisation category="msIonisation" value="microelectrospray"/>\n+      <msMassAnalyzer category="msMassAnalyzer" value="time-of-flight"/>\n+      <msDetector category="msDetector" value="microchannel plate detector"/>\n+      <software type="acquisition" name="MassHunter Data Acquisition" version="8.0"/>\n+    </msInstrument>\n+    <dataProcessing>\n+      <software type="conversion" name="ProteoWizard software" version="3.0.20287"/>\n+      <processingOperation name="Conversion to mzML"/>\n+    </dataProcessing>\n+    <scan num="676"\n+          scanType="Full"\n+          centroided="1"\n+          msLevel="1"\n+          peaksCount="164"\n+          polarity="+"\n+          retentionTime="PT0.668S"\n+          lowMz="101.059547842973"\n+          highMz="961.958412367698"\n+          basePeakMz="622.030137146612"\n+          basePeakIntensity="69123.5234"\n+          totIonCurrent="248205.188"\n+          msInstrumentID="1">\n+      <peaks compressionType="zlib"\n+             compressedLen="2042"\n+             precision="64"\n+             byteOrder="network"\n+             contentType="m/z-int">eJwtVXk81HkYJueqNkdS2Up0KJJ0b4c3MRvdslvKMY2jZpj7YEZ2hpkhGUc6aCsRSnSna7ccYzKdiErUWnYqtB0kalexvN/+fD7v8z7v877v9/f+wH9lTW5FohgSVu1t0dPTg60eP34dqLYA1davMsTKWIOMpmCIv3tfD7EmNkYX9AaEIjWJ35IWLK80AAbElQ/hbfJG3y9l3hDdlY/8bbcqs/O8x0H62gOoH0Ape/d6wBEi1icQrFh2Zr+LHaQuK8b8AGWZl9rJD2S+TtQhHKifMZ9TGw+ChWpArBRMz41+AcrAI8gP1Ej9O0rqIE2ejTho5fxj708uhcu3+XaI5WVPFhslQ6ZMmDOEg40OLdUdbAPGp3iCKdVWW3o2gqrCDOsFa7TNkLUS+OX/oT/qMGrBl4xEEKjZqE81YJ/dc8sBYrN02D91otjGwnc2HOx6QTCoepf0eoGofAL6pXqUOFMDPwOv/RXqU2kLj/+56SpEioehP+rxq0mpnt6QkJuDfrbrf6y58zkCslSJqLc9RCdVd1WDonMewdIBraunIcTarCe4suHlh3ljQOaRiP5ok1ecu7V6LzBHJ6M+LefmluvHZgMvzgD90HJ1Mp2tC+T/ew/7o1W8nigpNoGYrXq4L5rueybnbCMcsG4keroybUrDGGDsk6NeyJTY5ZvTNMAyaMN+QuID5mRtEwKnMJxgBc0qeuMNUHaewn5Cmmv96t7/BZwde1Av5K8n1Y7vpkPykR6Mh9LC5jw8UQlsQQHqh4aa7ztVdh44FafQb+jRXZoDjh1AH3MQ+WGeb08He10EUfwl1AsLVfcGT7oAJ9ZI0X+Yos0p5IEQhEnLsb+w48LiPvvJoBz7M/oL0zkmbjR2Bj5dh/rhuvWsgVQPYIpmYv7OkHar5U33IVt/IfJ3xhU5WLyvAdYa4m+nYpz7w/PdwJOR90439jtBWTsOeDMaMJ/u4B6yIGYMCPtLUJ+e501pNWmFmN5c1GNMae22vDgRMnT+yGdMm7DlSvtSYE1/jnoMzybHRW5BwD5qh/EIe6eGT71bgf0oA/UiHDzC86bWAa/cBPuLyEuwTSsfAdxf2fgeInSnlJN8SmDXwgmoF0lrdmn5eSwoq83RP9PeOzPuzR0QXq1GPlPRtEa5rgqivJ/ifJkFzzTHXzBBdkhL+Cct82b7USBlUyaJa90mjU6iAGcD0We+uJjp+7sDpDnPRD2WYWmLYZQEIjt3Yj5r95Y74X9QgJEwEv2yd6jELt65IAsqRT77xNsvNeppQH9Xg/rstvU31Qw94NmcxnyO4SzTcusoEPUcxPlxXJKKplyuBy59LfI5+83+KW6/DJJdO9EP17Jj9TX6UWCYd+P8uH7DMrfN6AGmewDqcS+Wvzd+LoSIbhrW55YUjzjUGg+RNoboj+fm6e/1rB5+vRuNcZ6flGpY4ArxGVYEC0o7ZvlsBuaFFajHq5wzxb1w/+B7/UCwJsX22uQg4G1KRT+8enq38nE98FiLcX98qzdG7A0WwJmCCwa+x7WAdRZ04ExuIvii3qylr34ApVsU9scvmdfwX3408HJ2YVxgbR79+s17kG9cRLDdHxOKd60FZZQt8gXzlzqfvTT4Dt5OxPoCdXCA/YrLwJ49F+sLerx3cymNwPNpRiy0yB3Rl1MOiu8ikC+cGlmTbd4KrKFuh7Cg9KdwszUQISP3UTR67s3T2sG9mmsxX7Rpt6vZmcHvGwhfdKmvacOR28BMJvdL9KC/bJbgF6Dbu6PfaIFq7MvtccB/2Yv86LP21HTROWDk/YPzFz9avbDoB1OgTxNjXDJvgF+iNYK0LCfMl3gN7zBb7QMMDaknufJy/cGCv2FPUivWk1Q9TdjsfBT4td/ibaZf/Wr2grDpCeKYBUHT7i3ph0SjCvQfQzlyh71vOIhCKrH/mP3X5g6bp4E43xmEn3+hfa3LKmDEkv9LTI+04QrDHLjf9KU2brHNC8QQGZeA/qSfEk5Yr+JAkn8cxmUG1dlafRfgZhG+bElMy4dSRxB+dEG/suKjrLCXvZC6zxr1ZZcKdyzTpwC3YTLOW86ZW30yXwadLYsI5hb+FlBfAXHJ27GenDe89lBANki+zV/O2+trbOEKPI4twfzzlMfObsA0OUv4AmNByOF1wNhI7qFc8NnW0dUJOA5/4/uRC19Ji2LdgNG2mMRFZRXqsQ+AlboB5yWPXsw31D8D5QdicF9ysX/8AcupwF6XTeISvb5pPl1AL/Im9WQ/Bj1MTYd9d9PQj8Ju5OO9Fafh8kryvSocR/'..b' id="116589">378031</offset>\n+    <offset id="117580">381307</offset>\n+    <offset id="118571">384710</offset>\n+    <offset id="119562">387835</offset>\n+    <offset id="120552">391129</offset>\n+    <offset id="121543">394293</offset>\n+    <offset id="122534">397521</offset>\n+    <offset id="123525">400897</offset>\n+    <offset id="124515">404214</offset>\n+    <offset id="125506">407398</offset>\n+    <offset id="126497">410787</offset>\n+    <offset id="127487">414032</offset>\n+    <offset id="128478">417353</offset>\n+    <offset id="129469">420629</offset>\n+    <offset id="130460">423770</offset>\n+    <offset id="131450">427287</offset>\n+    <offset id="132441">430500</offset>\n+    <offset id="133432">433684</offset>\n+    <offset id="134422">436925</offset>\n+    <offset id="135413">440324</offset>\n+    <offset id="136404">443585</offset>\n+    <offset id="137395">446910</offset>\n+    <offset id="138385">450182</offset>\n+    <offset id="139376">453393</offset>\n+    <offset id="140367">456574</offset>\n+    <offset id="141357">459818</offset>\n+    <offset id="142348">463059</offset>\n+    <offset id="143339">466171</offset>\n+    <offset id="144330">469259</offset>\n+    <offset id="145320">472432</offset>\n+    <offset id="146311">475746</offset>\n+    <offset id="147302">478931</offset>\n+    <offset id="148292">482272</offset>\n+    <offset id="149283">485480</offset>\n+    <offset id="150274">488757</offset>\n+    <offset id="151264">492146</offset>\n+    <offset id="152255">495391</offset>\n+    <offset id="153246">498660</offset>\n+    <offset id="154237">502031</offset>\n+    <offset id="155227">505396</offset>\n+    <offset id="156218">508629</offset>\n+    <offset id="157209">512145</offset>\n+    <offset id="158199">515486</offset>\n+    <offset id="159190">518951</offset>\n+    <offset id="160181">522200</offset>\n+    <offset id="161172">525409</offset>\n+    <offset id="162162">528734</offset>\n+    <offset id="163153">532019</offset>\n+    <offset id="164144">535208</offset>\n+    <offset id="165134">538537</offset>\n+    <offset id="166125">541785</offset>\n+    <offset id="167116">545074</offset>\n+    <offset id="168106">548291</offset>\n+    <offset id="169097">551655</offset>\n+    <offset id="170088">555127</offset>\n+    <offset id="171079">558319</offset>\n+    <offset id="172069">561432</offset>\n+    <offset id="173060">564728</offset>\n+    <offset id="174051">567889</offset>\n+    <offset id="175041">571225</offset>\n+    <offset id="176032">574386</offset>\n+    <offset id="177023">577714</offset>\n+    <offset id="178014">581271</offset>\n+    <offset id="179004">584548</offset>\n+    <offset id="179995">587829</offset>\n+    <offset id="180986">591066</offset>\n+    <offset id="181976">594310</offset>\n+    <offset id="182967">597631</offset>\n+    <offset id="183958">600891</offset>\n+    <offset id="184948">604107</offset>\n+    <offset id="185939">607267</offset>\n+    <offset id="186930">610672</offset>\n+    <offset id="187921">614049</offset>\n+    <offset id="188911">617390</offset>\n+    <offset id="189902">620642</offset>\n+    <offset id="190893">623791</offset>\n+    <offset id="191883">627112</offset>\n+    <offset id="192874">630464</offset>\n+    <offset id="193865">633753</offset>\n+    <offset id="194856">636862</offset>\n+    <offset id="195846">640119</offset>\n+    <offset id="196837">643207</offset>\n+    <offset id="197828">646456</offset>\n+    <offset id="198818">649723</offset>\n+    <offset id="199809">652979</offset>\n+    <offset id="200800">656501</offset>\n+    <offset id="201790">659817</offset>\n+    <offset id="202781">663034</offset>\n+    <offset id="203772">666247</offset>\n+    <offset id="204763">669528</offset>\n+    <offset id="205753">672948</offset>\n+    <offset id="206744">676253</offset>\n+    <offset id="207735">679618</offset>\n+    <offset id="208725">682911</offset>\n+    <offset id="209716">686056</offset>\n+  </index>\n+  <indexOffset>689294</indexOffset>\n+  <sha1>919d9f6aaa20533cbe9c75398a139a36bec4b6b0</sha1>\n+</mzXML>\n'
b
diff -r 000000000000 -r a07976bbc4d9 test-data/Uniprot.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/Uniprot.fasta Sun Nov 06 16:25:25 2022 +0000
b
b'@@ -0,0 +1,20 @@\n+>sp|Q8C4J7|TBL3_MOUSE Transducin beta-like protein 3 OS=Mus musculus GN=Tbl3 PE=2 SV=1\n+MAETAAGLCRFKANYAVERKIEPFYKGGKAQLDQTGHYLFCVCGTKVNILDVASGALLRSLEQEDQEDITSFDLSPDDEVLVTASRALLLAQWAWREGTVTRLWKAIHTAPVASMAFDATSTLLATGGCDGAVRVWDIVQHYGTHHFRGSPGVVHLVAFHPDPTRLLLFSSAVDTSIRVWSLQDRSCLAVLTAHYSAVTSLSFSEGGHTMLSSGRDKICIVWDLQSYQTTRTVPVFESVEASVLLPEQPAPALGVKSSGLHFLTAGDQGILRVWEAASGQCVYTQPQMPGLRQELTHCTLARAADLLLTVTADHNLLLYEAHSLQLQKQFAGYSEEVLDVRFLGPSDSHIVVASNSPCLKVFELQTLACQILHGHTDIVLALDVFRKGWLFASCAKDQSIRIWKMNKAGQVACVAQGSGHTHSVGTICCSRLKESFLVTGSQDCTVKLWPLPEALLAKSTAADSGPVLLQAQTTRRCHDKDINSLAVSPNDKLLATGSQDRTAKLWALPQCQLLGVFTGHRRGLWNVQFSPTDQVLATASADGTIKLWALQDFSCLKTFEGHDASVLKVAFVSRGSQLLSSGSDGLLKLWTIKSNECVRTLDAHEDKVWGLHCSQLDDHAITGGSDSRIILWKDVTEAEQAEEQAKREEQVIKQQELDNLLHEKRYLRALGLAISLDRPHTVLTVIQAIRRDPEACEKLEATVLRLRRDQKEALLRFCVTWNTNSRHCHEAQAVLGVLLRHEAPEELLAYDGVRGSLEALLPYTERHFQRLSRTLQAATFLDFLWHNMKLSPCPAAAPPAL\n+>tr|Q80ZP8|Q80ZP8_MOUSE Armet protein OS=Mus musculus GN=Manf PE=1 SV=1\n+METNNYLPSPPSFPVCISYLGRFYQDLKDRDVTFSPATIEEELIKFCREARGKENRLCYYIGATDDAATKIINEVSKPLAHHIPVEKICEKLKKKDSQICELKYDKQIDLSTVDLKKLRVKELKKILDDWGEMCKGCAEKSDYIRKINELMPKYAPKAASARTDL\n+>sp|Q60847|COCA1_MOUSE Collagen alpha-1(XII) chain OS=Mus musculus GN=Col12a1 PE=2 SV=3\n+MQTRLPRALAALGVALLLSSIEAEVDPPSDLNFKIIDENTVHMSWERPVDPIVGYRITVDPTTDGPTKEFTLAASTTETLLSDLIPETQYVVTITSYNEVEESVPVIGQLTIQTGGPTKPGEKKPGKTEIQKCSVSAWTDLVFLVDGSWSVGRNNFKYILDFIVALVSAFDIGEEKTRVGVVQYSSDTRTEFNLNQYYRREDLLAAVKKIPYKGGNTMTGDAIDYLVKNTFTESAGSRAGFPKVAIIITDGKSQDEVEIPARELRNIGVEVFSLGIKAADAKELKQIASTPSLNHVFNVANFDAIVDIQNEIISQVCSGVDEQLGELVSGEEVIEPPSNLVVTELSSKYIRLSWDPSPSAVTGYKILLTPMAAGSRHHALSVGPQTTTLNVRDLTADTEYQISVFAMKGLTSSEPTSVMEKTQPMKVQVECSRGVDIKADIVFLVDGSYSIGIANFVKVRAFLEVLAKSFEISPNRVQISLVQYSRDPHTEFTLKEFNRVEDIIKAINTFPYRGGSTNTGKAMTYVREKIFVPNKGSRSNVPKVMILITDGKSSDAFRDPAIKLRNSDVEIFAVGVKDAVRSELEAIASPPAETHVFTVEDFDAFQRISFELTQSICLRIEQELAAIKKKAYVPPKDLRFTQVTANSFKAEWSPPGDNVFSYHVTYKDANGDDEVTVVEPASSTSVVLNNLRPETLYLVNVTAEYEDGFSVPITGEETTAEVKGVPRNLKVTDETTDSFKLTWSQAPGRVLRYRIRYRPVSGGESKEVSTPANQRRKTLENLTPDTKYEISVIAEYSSGPGSPLTGNAATEEVRGNPRDLRVSDATTSTLKLSWSRAPGKVKQYLVTYTPAAGGETQEVTVRGDTTTTMLRKLKEGTQYDLSVTALYASGAGEALSGKGSTLEERGSPQNLVTKDITDTSIGAYWTSAPGMVRGYRVSWKSLYDDIEAGETTLPGDAIHTMIENLQPETKYKISVFATYSSGEGEPVTGDATTELSQDSKILRVDEETEHTMRVTWKAAPGKVVNYRVVYRPQGGGRQMVAKVPPTVTSTVLKRLQPQTTYDITVLPMYKTGEGKLRQGSGTTASRFKSPRNLKTSDPTMSSFRVTWEPAPGEVKGYKVTFHPTGDDRRLGELVLGPYDNTVVLEELRAGTTYRVNVFGMFDGGESLPLVGQEMTTLSDTTVTPFLSSGMDCLTRAEADIVLLVDGSWSIGRANFRTVRSFISRIVEVFEIGPKRVQIALAQYSGDPRTEWQLNAHRDKKSLLQAVANLPYKGGNTLTGMALNFIRQQSFKTQAGMRPRARKIGVLITDGKSQDDVEAPSKKLKDEGVELFAIGIKNADEVELKMIATDPDDTHAYNVADFESLSKIVDDLTINLCNSVKGPGDLEAPTNLVISERTHRSFRVSWTPPSDSVDRYKVEYYPVSGGKRQEFYVSRLDTSTVLKDLKPETDYVVNVYSVVEDEYSEPLKGTEKTLPVPVVSLNIYDVGPTTMHVQWQPVGGATGYTVSYQPTRSPEGTKPKEMRVGPTVNDVQLTGLLPNTEYEVTVQAVLYDLTSEPAKAREVTLPLPRPQDVKLRDVTHSTMNVVWEPVLGKVRKYIVRYKTPDEEFKEVEVDRSRASTILKDLSSQTQYTVSVSAVYDEGTSPPATAYDTTRRVPAPTNLQFTEVTPESFRGTWDHGASDVSLYRITWAPVGNPDKMETILNGDENTLVFENLNPNTPYEVSITAIYPDESESEDLSGTERTLRLIPLTTQAPKSGPRNLQVYNATSNSLTVKWDPASGRVQKYRITYQPSTGEGNEQTITVGGRQNSVLLQKLKPDTPYTITVYSQYPDGEGGRMTGRGKTKPLNTVRNLRVYDPSTSSLSVRWDHAEGNPRQYKLFYAPTSGGPEELVPIPGNTNYAILRNLQPDTPYTITVVPVYTEGDGGRTSDTGRTLVRGLARNIQVYNPTPNSLDVRWDPAPGPVQQYRIVYSPVAGTRPSESIVVPGNTRTVHLERLIPDTPYSVNIVALYSDGEGNPSPSQGRTLPRSGPRNIRVFGETTNSLSVAWDHADGPVQQYRIIYSPTVGDPIDEYTTVPGRRNNVILQPLQPDTPYKITVIAIYEDGDGGHLTGNGRTVGLLPPQNIHIFDEWYTRFRVSWDPSPSPVLGYKIVYKPVGSNEPMEAFVGEVTSYTLHNLNPSTTYDVSVYAQYDSGLSVPLTDQGTTLYLNVTDLKTYQVGWDTFCVKWSPHRAATSYRLKLSPADGTRGQEITVRGSETSHCFTGLSPEAEYGVTVFVQTPNLEGPGVPIKEQTTVKPTEAPTEPPTPSPPPTIPPARDVCKGAKADIVFLTDASWSIGDDNFNKVVKFIFNTVGAFDEVNPAGIQVSFVQYSDEVKSEFKLNTYNDKALALGALQNIRYRGGNTRTGKALTFIKEKVLTWESGMRKNVPKVLVVVTDGRSQDEVKKAAFVIQQSGFSVFVVGVADVDYNELANIASKPSERHVFIVDDFESFEKIEDNLITFVCETATSSCPLIYLDGYTSPGFKMLEAYNLTEKNFASVQGVSLESGSFPSYSAYRLQKNAFINQPTAELHPNGLPPSYTIILLFRLLPETPSDPFAIWQITDRDYRPQVGVIADPSSKTLSFFNKDTRGEVQTVTFDTDEVKTLFYGSFHKVHIVVTSKSVKIYIDCYEIIEKDIKEAGNITTDGYEILGKLLKGERKSATFQIQSFDIVCSPVWTSRDRCCDIPSRRDEAKCPALPNACTCTQDSVGPPGPPGPAGGPG'..b'GPPGPRGDTGPPGPQGPPGPQGPNGLSIPGEQGRQGMKGDAGEPGLPGRTGTPGLPGPPGPMGPPGDRGFTGKDGAMGPRGPPGPPGSPGSPGVTGPSGKPGKPGDHGRPGQSGLKGEKGDRGDIASQNMMRAVARQVCEQLISGQMSRFNQMLNQIPNDYHSSRNQPGPPGPPGPPGSAGARGEPGPGGRPGFPGTPGMQGPPGERGLPGEKGERGTGSQGPRGPPGPPGPQGESRTGPPGSTGSRGPPGPPGRPGNSGIRGPPGPPGYCDSSQCASIPYNGQGYPEPYVPEGGAYLPEREPFIVPVEPERTAEYEDDYGADEPDQQHPDHMRWRRALRPGPAE\n+>tr|D6RFR8|D6RFR8_MOUSE Choline/ethanolaminephosphotransferase 1 OS=Mus musculus GN=Cept1 PE=4 SV=1\n+MSGHRSTRKRCGDSHPESPVGFGHMSTTGHLCGLILPVLVAFSFTSLWMP\n+>tr|Q91VK2|Q91VK2_MOUSE Eef1d protein OS=Mus musculus GN=Eef1d PE=1 SV=1\n+MATNFLAHEKIWFDKFKYDDAERRFYEQMNGPVTSGSRQLKVMLPNSPEALGQATPGTSSGPGASSGPGGDHSELIVRITSLEVENQNLRGVVQDLQQAISKLEARLSSLEKSSPTPRATAPQTQHVSPMRQVEPPTKKGATPAEDDEDKDIDLFGSDEEEEDKEAARLREERLRQYAEKKAKKPTLVAKSSILLDVKPWDDETDMAQLETCVRSIQLDGLVWGASKLVPVGYGIRKLQIQCVVEDDKVGTDLLEEEITKFEEHVQSVDIAAFNKI\n+>tr|F6WN43|F6WN43_MOUSE Iron-sulfur cluster co-chaperone protein HscB, mitochondrial (Fragment) OS=Mus musculus GN=Hscb PE=1 SV=1\n+XQKSQTEKHFSDKHSTLVNDAYKTLQAPLTRGLYLVS\n+>sp|Q6NXK2|ZN532_MOUSE Zinc finger protein 532 OS=Mus musculus GN=Znf532 PE=1 SV=1\n+MTMGDMKTPDFDDLLAAFDIPDMVDPKAAIESGHDDHESHIKQNAHVDDDSHTPSSSDVGVSVIVKNVRNIDSSEGVEKDGHNPTGNGLHNGFLTASSLDSYGKDGAKSLKGDTPASEVTLKDPAFSQFSPISSAEEFEDDEKIEVDDPPDKEEARAGFRSNVLTGSAPQQDFDKLKALGGENSSKTGVSTSGHTDKNKVKREAESNSITLSVYEPFKVRKAEDKLKENSEKMLESRVLDGKPSSEKSDSGIAAAASSKTKPSSKLSSCIAAIAALSAKKAASDSCKEPVANSREASPLPKEVNDSPKAADKSPESQNLIDGTKKASLKPSDSPRSVSSENSSKGSPSSPVGSTPAIPKVRIKTIKTSSGEIKRTVTRVLPEVDLDSGKKPSEQAASVMASVTSLLSSSASATVLSSPPRAPLQTAMVTSAVSSAELTPKQVTIKPVATAFLPVSAVKTAGSQVINLKLANNTTVKATVISAASVQSASSAIIKAANAIQQQTVVVPASSLANAKLVPKTVHLANLNLLPQGAQATSELRQVLTKPQQQIKQAIINAAASQPPKKVSRVQVVSSLQSSVVEAFNKVLSSVNPVPVYTPNLSPPANAGITLPMRGYKCLECGDAFALEKSLSQHYDRRSVRIEVTCNHCTKNLVFYNKCSLLSHARGHKEKGVVMQCSHLILKPVPADQMIVPPSSNTAASTLQSSVGAATHTVPKVQPGIAGAVISAPASTPMSPAMPLDEDPSKLCRHSLKCLECNEVFQDEPSLATHFQHAADTSGQQMKKHPCRQCDKSFSSSHSLCRHNRIKHKGIRKVYACSHCPDSRRTFTKRLMLERHIQLMHGIKDPDVKELSDDAGDVTNDEEEEAEIKEDAKVPSPKRKLEEPVLEFRPPRGAITQPLKKLKINVFKVHKCAVCGFTTENLLQFHEHIPQHRSDGSSHQCRECGLCYTSHGSLARHLFIVHKLKEPQPVSKQNGAGEDSQQENKPSPEDEAAEGAASDRKCKVCAKTFETEAALNTHMRTHGMAFIKSKRMSSAEK\n+>sp|P58006|SESN1_MOUSE Sestrin-1 OS=Mus musculus GN=Sesn1 PE=1 SV=3\n+MRLAAASNEAYAASLAVSELLSCHQCGGDRGQDEELGIRIPRPLGHGPSRFIPEKEMLQVGSEDAQMHALFADSFAALGRLDNITLVMVFHPQYLESFLKTQHYLLQMDGPLPLHYRHYIGIMAAARHQCSYLVNLHVSDFLHVGGDPKWLNGLENAPQKLQNLGELNKVLAHRPWLITKEHIEGLLKAEEHSWSLAELVHAVVLLTHYHSLASFTFGCGISPEIHCDGGHTFRPPSVSNYCICDITNGNHSVDEMQVNSAGNASVSDSFFEVEALMEKMRQLQECREEEEASQEEMASRFEMEKRESMFVFSSDDDEVTPARDVSRHFEDTSYGYKDFSRHGMHVPTFRVQDYCWEDHGYSLVNRLYPDVGQLIDEKFHIAYNLTYNTMAMHKDVDTSMLRRAIWNYIHCMFGIRYDDYDYGEINQLLDRSFKVYIKTVVCTPEKVTKRMYDSFWRQFKHSEKVHVNLLLIEARMQAELLYALRAITRYMT\n+>tr|A0A1B0GSE5|A0A1B0GSE5_MOUSE Ubiquitin carboxyl-terminal hydrolase CYLD OS=Mus musculus GN=Cyld PE=1 SV=1\n+MSSGLWSQEKVTSPYWEERIFYLLLQECSVTDKQTQKLLKVPKGSIGQYIQDRSVGHSRVPSTKGKKNQIGLKILEQPHAVLFVDEKDVVEINEKFTELLLAITNCEERLSLFRNRLRLSKGLQVDVGSPVKVQLRSGEEKFPGVVRFRGPLLAERTVSGIFFGVELLEEGRGQGFTDGVYQGKQLFQCDEDCGVFVALDKLELIEDDDNGLESDFAGPGDTMQVEPPPLEINSRVSLKVGESTESGTVIFCDVLPGKESLGYFVGVDMDNPIGNWDGRFDGVQLCSFASVESTILLHINDIIPDSVTQERRPPKLAFMSRGVGDKGSSSHNKPKVTGSTSDPGSRNRSELFYTLNGSSVDSQQSKSKNPWYIDEAFGGYLSEVVEENTPPKMEKEGLEIMIGKKKGIQGHYNSCYLDSTLFCLFAFSSALDTVLLRPKEKNDIEYYSETQELLRTEIVNPLRIYGYVCATKIMKLRKILEKVEAASGFTSEEKDPEEFLNILFHDILRVEPLLKIRSAGQKVQDCNFYQIFMEKNEKVGVPTIQQLLEWSFINSNLKFAEAPSCLIIQMPRFGKDFKLFKKIFPSLELNITDLLEDTPRQCRICGGLAMYECRECYDDPDISAGKIKQFCKTCSTQVHLHPRRLNHSYHPVSLPKDLPDWDWRHGCIPCQKMELFAVLCIETSHYVAFVKYGKDDSAWLFFDSMADRDGGQNGFNIPQVTPCPEVGEYLKMSLEDLHSLDSRRIQGCARRLLCDAYMCMYQSPTMSLYK\n+>sp|Q60880|OL141_MOUSE Olfactory receptor 141 OS=Mus musculus GN=Olfr141 PE=3 SV=2\n+MRNITEATFFVLKGLTDNNELQIILFLLFLAIYIFTLIGNVGLIILVVGDSQLHNPMYCFLSVLSSVDACYSTDITPNMLVGFMSKSKIISFYGCATQMFLAVTFGTTECFLLAAMAYDRYVAIHDPLLYAVSMSPRVYIPLIIASYAGGIVHAIIHTVATFSLSFCRSNEVKHIFCDIPPLLAISCSETYVNELLLFFFVSFIELVTILIVLVSYAFILLSILKMNSSEGRRKVFSTCGAHLTAVSIYYGTILFMYVRPSSNYSLEHDMIVSTFYTIGIPMLNPIIYSLRNKDVKEAMKRVLRKKINIKHRIKKLNDFSVFLMP\n'
b
diff -r 000000000000 -r a07976bbc4d9 test-data/iTRAQ_f4.mgf
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/iTRAQ_f4.mgf Sun Nov 06 16:25:25 2022 +0000
b
b'@@ -0,0 +1,753 @@\n+COM=Conversion to mascot generic\n+CHARGE=2+ and 3+\n+BEGIN IONS\n+PEPMASS=740.462952\n+CHARGE=3+\n+SCANS=277\n+TITLE=Mo_Tai_iTRAQ_f4.00277.00277.3\n+111.017494 85.198502\n+112.240982 97.204994\n+114.110542 168.274780\n+115.107582 369.265503\n+115.650398 84.005325\n+117.296082 86.641182\n+117.595589 82.974037\n+120.657990 81.247025\n+123.208023 88.939392\n+126.714996 76.470490\n+126.995316 81.651260\n+129.369080 82.580246\n+129.410400 90.817963\n+132.734039 124.614685\n+143.307465 87.847046\n+178.966888 94.961578\n+179.972855 89.878273\n+183.256714 104.533241\n+188.080093 123.015953\n+212.102753 442.314178\n+213.104324 84.621696\n+233.001801 107.842552\n+244.242355 102.163200\n+281.079132 97.696259\n+291.216034 243.588058\n+309.183807 104.681831\n+325.188324 282.187622\n+345.226288 167.099777\n+347.629883 88.744476\n+357.377533 105.747673\n+388.266266 1321.324341\n+430.317047 94.113419\n+458.310547 310.033203\n+489.807434 100.114334\n+490.700165 99.780800\n+501.355072 164.809708\n+517.545532 119.780251\n+529.344849 395.354340\n+529.599487 100.128220\n+535.189514 101.317970\n+657.405518 110.483780\n+699.552063 101.576553\n+736.234497 130.142654\n+752.286011 111.876389\n+756.181641 93.424118\n+771.447876 505.619843\n+776.288391 100.766472\n+804.153748 99.673531\n+840.959473 131.680695\n+870.515198 596.371582\n+871.524719 224.175797\n+938.853760 112.032951\n+983.596008 538.290894\n+985.851929 109.672272\n+999.183228 110.428818\n+1006.435791 110.520103\n+1098.597168 117.997414\n+1102.095825 108.774673\n+1154.624023 115.541344\n+1179.853027 115.300293\n+1188.129639 112.100708\n+1328.742920 120.317390\n+1535.381592 114.408516\n+1578.387207 112.895355\n+1696.229492 122.310112\n+1865.684937 119.336388\n+1891.318359 108.014870\n+END IONS\n+BEGIN IONS\n+PEPMASS=596.816895\n+CHARGE=2+\n+SCANS=3419\n+TITLE=Mo_Tai_iTRAQ_f4.03419.03419.2\n+112.086548 2060.700684\n+113.070908 591.413391\n+114.110237 56227.753906\n+115.107254 40715.632813\n+116.110573 1253.002075\n+124.087646 334.579498\n+129.065491 335.658569\n+129.682831 322.525909\n+130.096924 432.119598\n+135.059509 290.456573\n+135.933548 316.717255\n+141.158234 324.162384\n+143.102081 1042.657227\n+143.108337 991.155334\n+145.106369 4993.616699\n+145.112579 9580.018555\n+146.116013 348.826385\n+151.422028 339.654999\n+152.189240 352.970459\n+155.080811 320.076233\n+156.112503 802.023926\n+157.107681 821.452209\n+158.092041 3474.361572\n+163.116852 649.046387\n+163.123260 573.363525\n+163.860764 368.470825\n+172.107132 547.236511\n+173.091751 424.643494\n+173.713470 325.451202\n+174.132874 1181.682129\n+174.138977 1457.565674\n+175.118500 19209.625000\n+176.121841 895.593079\n+180.310822 302.979675\n+185.090881 577.591370\n+185.163925 667.431763\n+189.086395 384.102600\n+193.535583 299.085999\n+198.085999 304.650818\n+202.127197 776.504089\n+202.133865 1047.345337\n+205.158951 325.465912\n+206.438217 407.963379\n+215.112625 944.689087\n+216.097275 349.972809\n+216.178452 628.929138\n+216.187073 1542.270264\n+218.158371 710.665344\n+219.997772 493.154785\n+226.117889 345.579254\n+227.530579 380.890015\n+229.117340 398.719696\n+231.095993 553.909363\n+232.139694 11610.142578\n+233.142776 541.624878\n+240.132904 413.648132\n+242.112793 354.861603\n+242.148621 757.952148\n+244.147949 340.507446\n+244.181870 1394.464355\n+244.207031 351.863098\n+246.153458 2635.449219\n+246.159882 2076.769775\n+255.143784 947.695679\n+260.123077 377.649994\n+261.163208 358.264160\n+268.138641 800.600464\n+269.122375 665.910522\n+269.220001 322.280029\n+271.175507 2574.782715\n+271.523804 335.527252\n+272.170105 1414.468018\n+274.152344 1745.901855\n+279.726440 358.126434\n+286.150787 2142.241211\n+287.134125 399.345337\n+287.153320 381.299835\n+288.201630 1045.604614\n+289.161011 642.731201\n+297.189941 313.076477\n+303.175964 1238.757568\n+304.159454 718.974304\n+309.070404 557.175232\n+309.572754 389.136902\n+315.128113 438.987366\n+315.165070 394.897858\n+318.127045 852.624146\n+329.155304 359.383026\n+330.138916 745.477112\n+330.163727 587.573120\n+332.788940 345.351257\n+341.179504 329.149353\n+343.196503 430.196503\n+345.225616 879.687500\n+346.184479 34'..b'08055.3\n+110.070747 1733.929932\n+112.086494 691.703613\n+114.110207 40570.949219\n+115.107246 29732.470703\n+116.110382 1231.719482\n+116.696106 632.937317\n+117.730354 471.628967\n+124.086235 1593.573853\n+127.085846 719.726074\n+127.191467 500.313782\n+129.064926 511.926025\n+129.129395 1360.861450\n+136.075058 651.347961\n+137.249298 489.442627\n+143.102310 528.153137\n+143.108459 983.870300\n+145.106354 5602.307617\n+145.112564 9344.262695\n+155.080536 649.520813\n+158.091660 1477.552002\n+162.132690 594.649658\n+162.139435 534.015381\n+173.417542 600.326477\n+175.118454 8973.086914\n+176.120972 555.123108\n+178.371323 511.018158\n+183.148560 607.971863\n+186.086960 652.429138\n+188.148453 816.252747\n+188.154907 1523.843628\n+199.106628 571.695862\n+206.436493 1035.268555\n+212.269272 591.934021\n+214.144180 900.448364\n+216.150284 2525.229248\n+227.101578 976.558044\n+230.201385 1142.054443\n+242.148682 1397.006470\n+243.107559 677.465942\n+243.133698 1371.145142\n+244.138000 891.661987\n+244.180954 1242.425537\n+246.153366 2297.038574\n+254.730103 532.118347\n+255.144455 987.050415\n+256.688324 533.629761\n+257.158569 875.375305\n+272.170959 2529.128906\n+272.908997 502.400146\n+274.186554 13132.186523\n+287.221313 1091.025513\n+291.214172 2984.217773\n+300.154175 1022.979675\n+308.174438 1182.723389\n+311.169250 569.517273\n+315.217712 1153.479858\n+320.089233 1019.081665\n+329.195770 1409.046875\n+330.298096 523.613220\n+331.206055 940.368896\n+345.223816 1784.856079\n+348.235840 683.953247\n+348.581970 560.229858\n+368.226654 641.918640\n+371.281464 720.593628\n+372.184631 537.945129\n+378.248566 1106.098633\n+379.243256 531.171021\n+386.216095 1908.169556\n+388.270569 1083.493164\n+399.715698 3641.003906\n+402.287842 531.509766\n+407.745789 883.040344\n+407.965881 569.346497\n+412.240295 632.917664\n+415.698425 1032.095337\n+428.227112 4306.428711\n+428.261108 1225.675537\n+428.725769 881.870422\n+429.260712 3728.557373\n+429.697418 1331.391235\n+445.288818 567.610901\n+448.071899 583.037292\n+455.416718 647.968628\n+464.268341 654.572754\n+470.773743 1128.713501\n+472.250061 3780.671875\n+473.252808 1594.682739\n+473.278687 2412.803467\n+481.325806 1259.738159\n+484.769775 1385.499390\n+485.271332 613.115601\n+491.173309 585.062622\n+491.329742 911.582214\n+497.316864 671.196655\n+499.275757 1172.343262\n+499.337067 1123.132935\n+500.283569 1279.582520\n+500.335480 1331.533203\n+501.255157 671.378113\n+506.350983 526.060120\n+515.294067 595.644592\n+520.279419 564.501221\n+528.327942 1453.140137\n+528.796143 1023.938416\n+530.344971 699.704163\n+534.306091 632.479187\n+556.821533 578.409241\n+557.308167 996.385559\n+562.368835 1061.597290\n+562.630188 599.749634\n+563.383240 597.036011\n+572.329102 704.391174\n+575.329651 597.594116\n+578.266602 569.538757\n+584.834595 1397.603638\n+585.341125 596.237427\n+585.828064 634.964417\n+592.849548 948.947998\n+593.338867 8331.064453\n+593.809753 1243.525757\n+593.850098 3570.665283\n+594.347534 5469.266113\n+601.328064 1251.846069\n+612.421753 868.523682\n+615.363525 1159.816772\n+635.785217 692.349304\n+645.406799 926.912354\n+647.354187 1344.844971\n+660.368103 1515.965698\n+667.035950 629.281006\n+678.553528 864.705811\n+686.401672 1415.408081\n+687.406799 956.555176\n+701.317932 638.253906\n+713.436462 577.175781\n+714.438171 979.025330\n+721.332031 1133.021240\n+734.864807 659.578308\n+758.495483 1101.013306\n+759.436768 1680.954834\n+814.488220 766.761841\n+825.458008 2101.567139\n+873.476807 3603.638672\n+876.500122 1146.794800\n+877.493591 2904.569092\n+878.501526 2154.676025\n+879.500305 1179.630981\n+896.207703 648.875244\n+914.434082 1090.736938\n+914.517822 1977.191284\n+928.515015 1886.298706\n+930.495483 1311.800903\n+952.429504 625.323181\n+965.766296 606.633911\n+972.546692 2437.769531\n+999.546753 632.162537\n+1026.609131 980.280151\n+1040.573853 1742.042114\n+1041.564087 3165.200439\n+1042.581787 3063.955566\n+1043.577515 6683.765625\n+1045.518311 945.700500\n+1147.621704 832.881104\n+1148.635742 1159.247681\n+1467.104980 653.335815\n+1533.474243 661.718018\n+1620.307251 616.238525\n+1664.717529 648.275024\n+END IONS\n'
b
diff -r 000000000000 -r a07976bbc4d9 test-data/immunopeptidomics.mgf
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/immunopeptidomics.mgf Sun Nov 06 16:25:25 2022 +0000
b
b'@@ -0,0 +1,464 @@\n+BEGIN IONS\n+TITLE=controllerType=0 controllerNumber=1 scan=19846\n+RTINSECONDS=2320.06458\n+PEPMASS=383.529876708984\n+CHARGE=3+\n+84.0449677 46347.0703125\n+84.0813446 85493.9453125\n+86.0719299 7175.7060546875\n+86.0969772 135316.21875\n+87.0795746 57686.53515625\n+89.5852509 6013.955078125\n+91.0547638 26870.0390625\n+100.0871506 10508.3408203125\n+101.0712357 8028.2236328125\n+102.0548477 7109.3364257813\n+110.071434 72448.5390625\n+112.0872192 68537.90625\n+116.0708847 66026.75\n+116.6829987 7043.2426757813\n+119.0492325 28436.21484375\n+120.0808487 28182.986328125\n+123.0442657 6282.2768554688\n+127.0979004 32528.88671875\n+129.1026154 74929.3046875\n+129.1124268 15517.341796875\n+132.1023407 7616.8291015625\n+136.075592 267654.46875\n+137.0793915 44604.71484375\n+140.0816498 8406.1591796875\n+145.4732819 7887.0209960938\n+147.0440521 10594.44921875\n+147.1123962 10032.357421875\n+155.0816803 6984.1274414063\n+157.1085968 34948.90234375\n+165.0540466 39318.01953125\n+167.0815887 29707.244140625\n+168.085022 6312.9848632813\n+182.0816193 28942.546875\n+183.1242371 7433.0512695313\n+183.1487885 8203.357421875\n+193.0978699 6826.6010742188\n+195.0764313 23284.12109375\n+195.1120148 9413.0185546875\n+197.1287689 31395.33203125\n+198.132309 9345.76953125\n+199.7877808 5461.4345703125\n+213.0883179 6907.8862304688\n+217.1338043 13646.8583984375\n+219.1365814 28881.201171875\n+226.1663971 13425.7822265625\n+244.165451 62294.3984375\n+245.1695709 14033.3974609375\n+249.673233 32895.77734375\n+254.1607361 72503.140625\n+255.1666107 6893.8310546875\n+259.0739441 12570.2685546875\n+260.0770569 6460.126953125\n+271.1891785 9831.76953125\n+275.1358337 11066.83984375\n+304.6169434 9695.1650390625\n+308.5368347 10936.181640625\n+308.8744507 6715.9243164063\n+311.181427 8423.06640625\n+326.7102356 8839.98828125\n+328.2081909 21860.5078125\n+329.8709106 7965.8657226563\n+330.2044983 8398.9033203125\n+331.1609192 7686.9453125\n+333.8371277 25565.46484375\n+334.1699219 7952.1284179688\n+339.8395081 31163.154296875\n+340.1759949 26240.822265625\n+340.6808167 36919.71484375\n+342.1118774 7167.1025390625\n+342.1811218 10171.65234375\n+346.5349731 7574.7329101563\n+347.7381592 9350.056640625\n+348.4993286 7552.921875\n+353.6708679 38643.10546875\n+354.1769409 6889.3901367188\n+354.2250671 21217.833984375\n+361.6572571 6491.6513671875\n+362.1836853 6020.7607421875\n+363.1853333 8824.9462890625\n+377.2033691 6569.89453125\n+381.2067871 7040.6538085938\n+383.2186279 68377.4609375\n+383.3130188 116036.234375\n+383.526886 42512.03125\n+385.2560425 10095.142578125\n+398.2119751 25488.392578125\n+401.2857666 10739.900390625\n+410.2869873 10938.7431640625\n+417.2008667 6045.6533203125\n+417.696991 8364.318359375\n+418.2027893 8019.1762695313\n+426.2158203 9391.662109375\n+428.8858948 6009.2065429688\n+431.206543 9535.4150390625\n+451.2514343 6296.6337890625\n+465.7139282 6659.9360351563\n+466.2247925 8575.556640625\n+475.2226257 6292.1694335938\n+488.2868042 7346.7373046875\n+489.2886047 30622.896484375\n+491.2367249 8038.7392578125\n+492.2262268 27380.2578125\n+496.3111572 9502.2919921875\n+498.3398438 83627.8203125\n+499.348114 9477.421875\n+502.2510376 7497.5302734375\n+502.8083191 7691.1728515625\n+518.2723389 29630.49609375\n+519.2763672 13119.953125\n+656.3309937 6904.6923828125\n+673.3564453 8458.634765625\n+END IONS\n+BEGIN IONS\n+TITLE=controllerType=0 controllerNumber=1 scan=19905\n+RTINSECONDS=2325.98454\n+PEPMASS=534.22802734375\n+CHARGE=2+\n+74.0607834 11525.5478515625\n+80.820961 1134.3864746094\n+84.0448685 11916.904296875\n+84.0813599 24140.73046875\n+86.0719757 1059.546875\n+86.0969696 48334.11328125\n+87.0556259 2711.1242675781\n+87.0794067 2536.3103027344\n+87.099884 1441.4647216797\n+88.0397949 1339.0686035156\n+89.0711365 5940.744140625\n+95.5842514 960.4934692383\n+100.0871887 1435.1180419922\n+101.0711517 11117.935546875\n+102.0551834 7843.828125\n+104.0528793 2629.0866699219\n+107.0505447 1256.6583251953\n+107.47509 1007.3388061523\n+110.0714264 24055.96484375\n+112.087204 2137.0339355469\n+115.0872574 2242.5446777344\n+119.0812531 1181.8509521484'..b'68.3342896 1452.5230712891\n+682.3339233 1898.4290771484\n+683.3429565 1458.1762695313\n+696.3226318 1923.4722900391\n+784.5008545 6190.7158203125\n+790.3800659 2451.6320800781\n+819.3933716 4207.2880859375\n+820.4173584 2018.9385986328\n+824.4292603 11264.025390625\n+869.4186401 2067.2492675781\n+882.4277954 1771.7611083984\n+884.423584 1570.5802001953\n+885.4588623 2440.49609375\n+955.4633789 7311.4379882813\n+969.456604 2234.6115722656\n+END IONS\n+BEGIN IONS\n+TITLE=controllerType=0 controllerNumber=1 scan=19944\n+RTINSECONDS=2329.22502\n+PEPMASS=516.783386230469\n+CHARGE=2+\n+72.0815811 27197.671875\n+74.0610199 4197.1069335938\n+84.0451736 15634.2109375\n+84.0815887 26392.96875\n+86.0969391 88900.34375\n+87.0557785 6371.4975585938\n+87.1004715 5257.353515625\n+88.0400085 4621.7041015625\n+101.0712738 5125.9956054688\n+102.0554962 23467.248046875\n+107.0487747 4362.7963867188\n+110.0715256 339710.21875\n+111.0756683 11064.5341796875\n+112.0868912 4111.2602539063\n+116.0706635 55538.3046875\n+120.080925 26441.748046875\n+127.0875549 4627.248046875\n+129.102829 26702.419921875\n+132.1021881 5254.7578125\n+133.0611267 3728.3393554688\n+136.0756378 91992.3203125\n+137.0794525 4378.3774414063\n+138.0666656 7507.4252929688\n+145.5386963 6195.8090820313\n+157.1097717 3760.1879882813\n+159.0761414 3559.2092285156\n+166.086441 5174.974609375\n+169.0968933 6497.8017578125\n+173.09198 66982.4140625\n+180.113205 6698.7612304688\n+181.0975647 20135.044921875\n+182.081604 7997.3110351563\n+183.1493378 16863.73046875\n+197.1275787 6301.8452148438\n+202.0863037 3530.7102050781\n+208.1073456 25956.681640625\n+209.0920258 14764.1796875\n+218.0425568 28767.90234375\n+229.1558533 5750.8208007813\n+233.0927124 4071.7492675781\n+235.1186981 36820.6640625\n+243.1336212 24782.921875\n+267.1106567 5503.90625\n+278.1124878 4135.1215820313\n+286.1757813 15374.74609375\n+304.1647339 5803.3159179688\n+306.0768738 3530.1059570313\n+318.1595459 5520.9609375\n+330.1925964 14000.76171875\n+344.6773376 3574.6950683594\n+356.2409973 12024.30078125\n+360.2006531 46041.26171875\n+360.7026062 19602.333984375\n+363.6889648 16339.1533203125\n+364.1605225 3471.5439453125\n+365.1912537 6514.8598632813\n+365.6857605 3434.3635253906\n+372.6929016 23375.6328125\n+374.1980286 240148.9375\n+374.6990051 88531.46875\n+377.6847839 18261.869140625\n+378.1841431 4990.4458007813\n+384.2341614 28763.40234375\n+386.6903687 14500.7939453125\n+398.2019958 16223.544921875\n+416.7427673 8074.5288085938\n+423.2320251 4371.8520507813\n+425.1813965 4210.1938476563\n+430.7402344 27642.935546875\n+431.2440491 13417.583984375\n+442.2075195 7980.6059570313\n+442.2713928 4595.1391601563\n+442.7108459 5553.3310546875\n+448.2337952 8279.3447265625\n+448.7311707 5624.8461914063\n+451.2121582 8333.0185546875\n+451.7119141 4570.4624023438\n+457.7275391 17480.1015625\n+459.2512817 48900.5546875\n+459.7523804 29497.771484375\n+460.2167053 5359.6381835938\n+498.7574158 3551.4931640625\n+499.2520752 4235.8666992188\n+507.2600708 53245.89453125\n+507.7609253 46670.12890625\n+508.2612305 19332.828125\n+516.2666626 4137.541015625\n+516.7805176 58299.46875\n+517.281189 36883.984375\n+529.3075562 16754.47265625\n+556.2666626 3977.314453125\n+582.3347168 7930.2817382813\n+599.2963867 5640.9077148438\n+610.3297729 130150.6640625\n+611.3359375 27716.517578125\n+617.3026733 19406.369140625\n+618.3014526 5174.8359375\n+626.3168335 4723.9135742188\n+635.3135986 17860.3515625\n+636.3198853 4314.6948242188\n+643.3532715 23298.431640625\n+644.3613892 4250.1220703125\n+667.2992554 8192.587890625\n+685.3235474 3758.7578125\n+719.3981934 13301.7373046875\n+720.395752 4378.724609375\n+729.3352051 7709.2412109375\n+747.3901367 84267.8828125\n+748.3964233 29535.37109375\n+754.3642578 5714.333984375\n+755.3690186 3943.5083007813\n+764.3662109 6421.2250976563\n+772.3707886 3762.69140625\n+789.3843384 4607.880859375\n+791.3812256 3588.5078125\n+798.3960571 6360.8334960938\n+806.4115601 30085.07421875\n+832.4921875 4568.6284179688\n+833.508728 4909.1865234375\n+860.4714355 13005.275390625\n+895.4536743 16561.779296875\n+896.4584961 4322.0971679688\n+END IONS\n'
b
diff -r 000000000000 -r a07976bbc4d9 test-data/novel_peptides
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/novel_peptides Sun Nov 06 16:25:25 2022 +0000
b
@@ -0,0 +1,6 @@
+DSGASGSILEASAAR
+ELGSSDLTAR
+SPYREFTDHLVK
+RQVPEHLGP
+RPGPGTRKSL
+MTDRHAGTY
b
diff -r 000000000000 -r a07976bbc4d9 test-data/novel_proteins.fa
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/novel_proteins.fa Sun Nov 06 16:25:25 2022 +0000
b
@@ -0,0 +1,6 @@
+>DSGASGSILEASAAR
+DSGASGSILEASAAR
+>ELGSSDLTAR
+ELGSSDLTAR
+>SPYREFTDHLVK
+SPYREFTDHLVK
b
diff -r 000000000000 -r a07976bbc4d9 test-data/pep.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/pep.txt Sun Nov 06 16:25:25 2022 +0000
b
@@ -0,0 +1,2 @@
+LVVVGADGVGK
+AHSSMVGVNLPQK
b
diff -r 000000000000 -r a07976bbc4d9 test-data/small-index-filter.mzML
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/small-index-filter.mzML Sun Nov 06 16:25:25 2022 +0000
b
b'@@ -0,0 +1,514 @@\n+<?xml version="1.0" encoding="utf-8"?>\n+<indexedmzML xmlns="http://psi.hupo.org/ms/mzml" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://psi.hupo.org/ms/mzml http://psidev.info/files/ms/mzML/xsd/mzML1.1.2_idx.xsd">\n+  <mzML xmlns="http://psi.hupo.org/ms/mzml" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://psi.hupo.org/ms/mzml http://psidev.info/files/ms/mzML/xsd/mzML1.1.0.xsd" id="small" version="1.1.0">\n+    <cvList count="2">\n+      <cv id="MS" fullName="Proteomics Standards Initiative Mass Spectrometry Ontology" version="4.1.41" URI="https://raw.githubusercontent.com/HUPO-PSI/psi-ms-CV/master/psi-ms.obo"/>\n+      <cv id="UO" fullName="Unit Ontology" version="09:04:2014" URI="https://raw.githubusercontent.com/bio-ontology-research-group/unit-ontology/master/unit.obo"/>\n+    </cvList>\n+    <fileDescription>\n+      <fileContent>\n+        <cvParam cvRef="MS" accession="MS:1000579" name="MS1 spectrum" value=""/>\n+        <cvParam cvRef="MS" accession="MS:1000580" name="MSn spectrum" value=""/>\n+      </fileContent>\n+      <sourceFileList count="3">\n+        <sourceFile id="RAW1" name="small.RAW" location="file:///">\n+          <cvParam cvRef="MS" accession="MS:1000768" name="Thermo nativeID format" value=""/>\n+          <cvParam cvRef="MS" accession="MS:1000563" name="Thermo RAW format" value=""/>\n+          <cvParam cvRef="MS" accession="MS:1000569" name="SHA-1" value="b43e9286b40e8b5dbc0dfa2e428495769ca96a96"/>\n+        </sourceFile>\n+        <sourceFile id="small.mzML" name="small.mzML" location="file:///">\n+          <cvParam cvRef="MS" accession="MS:1000569" name="SHA-1" value="4efa13a2795731b5f2a1ff1c463daf0d24b9a9d9"/>\n+        </sourceFile>\n+        <sourceFile id="small-peakpicking-cwt-allMS.mzML" name="small-peakpicking-cwt-allMS.mzML" location="file:///">\n+          <cvParam cvRef="MS" accession="MS:1000569" name="SHA-1" value="8e3d422853cbd71cc5f2af6422e0893caf6447dc"/>\n+        </sourceFile>\n+      </sourceFileList>\n+    </fileDescription>\n+    <referenceableParamGroupList count="1">\n+      <referenceableParamGroup id="CommonInstrumentParams">\n+        <cvParam cvRef="MS" accession="MS:1000448" name="LTQ FT" value=""/>\n+        <cvParam cvRef="MS" accession="MS:1000529" name="instrument serial number" value="SN06061F"/>\n+      </referenceableParamGroup>\n+    </referenceableParamGroupList>\n+    <softwareList count="3">\n+      <software id="Xcalibur" version="1.1 Beta 7">\n+        <cvParam cvRef="MS" accession="MS:1000532" name="Xcalibur" value=""/>\n+      </software>\n+      <software id="pwiz" version="3.0.8981">\n+        <cvParam cvRef="MS" accession="MS:1000615" name="ProteoWizard software" value=""/>\n+      </software>\n+      <software id="pwiz_3.0.20287" version="3.0.20287">\n+        <cvParam cvRef="MS" accession="MS:1000615" name="ProteoWizard software" value=""/>\n+      </software>\n+    </softwareList>\n+    <instrumentConfigurationList count="2">\n+      <instrumentConfiguration id="IC1">\n+        <referenceableParamGroupRef ref="CommonInstrumentParams"/>\n+        <componentList count="3">\n+          <source order="1">\n+            <cvParam cvRef="MS" accession="MS:1000073" name="electrospray ionization" value=""/>\n+            <cvParam cvRef="MS" accession="MS:1000057" name="electrospray inlet" value=""/>\n+          </source>\n+          <analyzer order="2">\n+            <cvParam cvRef="MS" accession="MS:1000079" name="fourier transform ion cyclotron resonance mass spectrometer" value=""/>\n+          </analyzer>\n+          <detector order="3">\n+            <cvParam cvRef="MS" accession="MS:1000624" name="inductive detector" value=""/>\n+          </detector>\n+        </componentList>\n+        <softwareRef ref="Xcalibur"/>\n+      </instrumentConfiguration>\n+      <instrumentConfiguration id="IC2">\n+        <referenceableParamGroupRef ref="CommonInstrumentParams"/>\n+        <componentList count="3">\n+          <source order="1">\n'..b'CWmFUIlOhV8hdFFUCX1FbUlMRWVJZQVByVqFRYVKBVGJRYVeRWoFdoVmBU3FcEVgRXCFTsV0RU2JYMldhWaFYA1qRXcFq1cgVtRVpFZ8VaSXUFU8VJBUKFQElACUaFe0V8iVHFaMV0BUuFVcVqhVSFSkVyRXzJX8VACVaJWsVsCXpFfQVfiYeW8FYUVoSW0Jaw1thSyYkPhJfbV3lXwFYYVsSVWFVUliBVVFWQWT1lhXSJWUVARWSNe4WD1gRZ/VQFaIV7BVRFRIlBhXWFWIVyzVyFawV8BWzFZglMhUTJr9WEV0xVRFVYV5xX3FUQ1axVKFdcV8BUjFSAVxBXLJSgVlxWNFbUVMBWyFVcVPyVAJUMVdxWTFV8VpRXUFTQVExWWJSAVTBUaFScVlBWRFt5aUVQRYdXWFr9SYVUxUMJYgVVRXgJWY1QRbNUiFrtW8VTRbsX3FqlYQVQBbIXBFbkWzlUxXGFRcViRUzFm9dcVYBVKFVQVGhZeUqFl5v9c4WnlBhYrVyFUQlECVTFUMlZhWPFW0VLyUkFGIiTTwVWvVRVZEl0RVjFdsVXRWVFcQm/mOl4BbaUlFSc1eSUhFUsV3hW1JcmFmmUUNfQlNxUGFecVYyUeFb0VDSXmFdQVpBWfFcAVjxX2FcgVdiZcWAFpxYkVXBWWFWcVexVyFQoV2BZMXSFTQlYSWGFboVaxXMFdMVYhWTFacV/SV5FXYlcxV4FTQVCRU4Jh5QIVIhYfVxFeUVKha/VpFZYVpSYfV3FVYVqhZZYLVSFslbolIBUWFQwWvGvV0RZtYPWhFSMWfm+12xW0FbMVoiUJJQQV8BY9W3FbUV/ha8UhFdoW/G7mG1lhXBFttopZMVTCXUFUMWbFrhVkFawVRRX6Jc02ilVRZ+UZFSUVXhUbJRcVECWhFs9WwVARbKbdURJn1qlt8=</binary>\n+            </binaryDataArray>\n+          </binaryDataArrayList>\n+        </spectrum>\n+      </spectrumList>\n+      <chromatogramList count="1" defaultDataProcessingRef="pwiz_Reader_conversion">\n+        <chromatogram index="0" id="TIC" defaultArrayLength="48">\n+          <cvParam cvRef="MS" accession="MS:1000235" name="total ion current chromatogram" value=""/>\n+          <binaryDataArrayList count="2">\n+            <binaryDataArray encodedLength="512">\n+              <cvParam cvRef="MS" accession="MS:1000523" name="64-bit float" value=""/>\n+              <cvParam cvRef="MS" accession="MS:1000576" name="no compression" value=""/>\n+              <cvParam cvRef="MS" accession="MS:1000595" name="time array" value="" unitCvRef="UO" unitAccession="UO:0000031" unitName="minute"/>\n+              <binary>ZjGx+bg2dD+CXqWoICyAPwIjQjaj+YY/yxgMm+5ilz9SJ6CJsOGhPzDw3Hu45Kg/YUwNR2q0rz/cnbXbLjSzP79Qravv6bM/oyv+3L3JtD9PJltKg8i3Px6vLSlk1Lo/jMOZX80Bvj9XaA3LjKTAP2XsccyfXMI/+6bDHYK9wj8lzLT9KyvDP7/ERdseqsQ/N8MN+Pwwxj/upJiWa+THP45AvK5fsMk/HdRY1aVZyz8p2GzSWr7LPze2sexcK8w/LiySiW7QzT/ABG7dzVPPP3qFGMJEltA/dQrf6FBz0T8dEA7jW0XSP9VGYm9PfdI/JpUWG+Bv0z+k374OnDPUP1yfTLaUBtU/p7OTwVHy1T/p/temnvLWP87s4E2kIdc/1VsDWyVY1z9qIIMC3BnYP0Kd3x0G4Ng/Hg4lbb252T/0gfdohJHaPxAO41tFbNs/5B+QXue52z8v2vZQtfDbP1MiiV5Gsdw/0akrn+V53T9t5RI0U0feP2q0L7PiLt8/</binary>\n+            </binaryDataArray>\n+            <binaryDataArray encodedLength="204">\n+              <cvParam cvRef="MS" accession="MS:1000519" name="32-bit integer" value=""/>\n+              <cvParam cvRef="MS" accession="MS:1002313" name="MS-Numpress positive integer compression" value=""/>\n+              <cvParam cvRef="MS" accession="MS:1000515" name="intensity array" value="" unitCvRef="MS" unitAccession="MS:1000131" unitName="number of detector counts"/>\n+              <binary>LA+Y4uK9TDci+DLstjyesTt98THb2C4FJ+Jo3tk7Ivw/xfY6BeE5R5Ex3zIQxZYRLJxoom8tATs/dTO74TOrIjffMhIRzAEj71gTtcHzCk1j33ETDE0TnSUhAIwVEibL2zKIxTmW0TNssTePES8Du/I+zjY2pO83EJkz+aE3gmI75TErlVeytva8MZ0eNxZmNktROAmBM3Ax</binary>\n+            </binaryDataArray>\n+          </binaryDataArrayList>\n+        </chromatogram>\n+      </chromatogramList>\n+    </run>\n+  </mzML>\n+  <indexList count="2">\n+    <index name="spectrum">\n+      <offset idRef="controllerType=0 controllerNumber=1 scan=3">5613</offset>\n+      <offset idRef="controllerType=0 controllerNumber=1 scan=4">14184</offset>\n+      <offset idRef="controllerType=0 controllerNumber=1 scan=5">26042</offset>\n+      <offset idRef="controllerType=0 controllerNumber=1 scan=11">36558</offset>\n+      <offset idRef="controllerType=0 controllerNumber=1 scan=14">48029</offset>\n+      <offset idRef="controllerType=0 controllerNumber=1 scan=15">57512</offset>\n+      <offset idRef="controllerType=0 controllerNumber=1 scan=16">65293</offset>\n+    </index>\n+    <index name="chromatogram">\n+      <offset idRef="TIC">76431</offset>\n+    </index>\n+  </indexList>\n+  <indexListOffset>78381</indexListOffset>\n+  <fileChecksum>190e7438359420dfb1a9b11d5829700a34ec36bd</fileChecksum>\n+</indexedmzML>\n'