comparison metafiles2pin.xml @ 0:3a49065a05d6 draft

planemo upload for repository https://github.com/galaxyproteomics/tools-galaxyp/tools/percolator commit b4871f9659a924a68430aed3a93f4f9bad733fd6
author galaxyp
date Wed, 07 Dec 2016 16:43:51 -0500
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:3a49065a05d6
1 <tool id="metafiles2pin" name="Merge search data" version="1.0">
2 <description>before creating percolator input</description>
3 <stdio>
4 <exit_code range="1:" />
5 </stdio>
6 <command>python $__tool_directory__/metafiles2pin.py
7 --batchsize $percopoolsize
8 #if len($percopoolids) > 0
9 --percolator-pool-ids
10 #for $ppool in $percopoolids
11 "${ppool.ppool_identifier}"
12 #end for
13 #end if
14 --spectrafiles
15 #for $specfile in $searchresult.keys()
16 "$specfile"
17 #end for
18 --searchfiles
19 #for $specfile in $searchresult.keys()
20 "$searchresult[$specfile]"
21 #end for
22 </command>
23 <inputs>
24 <param name="percopoolsize" type="integer" value="8" label="Amount of fractions to batch per Percolator process" />
25 <repeat name="percopoolids" title="Percolator pools" help="For cases where file amounts cause search results to not automatically line up into correct percolator batches">
26 <param name="ppool_identifier" type="text" label="Filename part identifying percolator pool"
27 help="Specify part of the input spectra filenames that are unique for each percolator pool, e.g set_A."/>
28 </repeat>
29 <param name="searchresult" type="data_collection" format="mzid" label="MSGF+, SQT or XTandem search results" />
30 </inputs>
31 <outputs>
32 <collection name="metafile_collection" type="list" label="Percolator metafiles list">
33 <discover_datasets pattern="__designation_and_ext__" directory="metafiles" />
34 </collection>
35 </outputs>
36 <tests>
37 <test>
38 <param name="percopoolsize" value="2"/>
39 <param name="searchresult">
40 <collection type="list">
41 <element name="fraction_one_spectra" value="empty_file1.mzid"/>
42 <element name="fraction_two_spectra" value="empty_file2.mzid"/>
43 <element name="fraction_three_spectra" value="empty_file3.mzid"/>
44 <element name="fraction_four_spectra" value="empty_file4.mzid"/>
45 </collection>
46 </param>
47 <output_collection name="metafile_collection" type="list">
48 <element name="percolatorpool0">
49 <assert_contents>
50 <has_text_matching expression="dataset_1.dat" />
51 <has_text_matching expression="dataset_2.dat" />
52 </assert_contents>
53 </element>
54 <element name="percolatorpool1">
55 <assert_contents>
56 <has_text_matching expression="dataset_3.dat" />
57 <has_text_matching expression="dataset_4.dat" />
58 </assert_contents>
59 </element>
60 </output_collection>
61 </test>
62 <test>
63 <param name="percopoolsize" value="2"/>
64 <repeat name="percopoolids">
65 <param name="ppool_identifier" value="set1"/>
66 </repeat>
67 <repeat name="percopoolids">
68 <param name="ppool_identifier" value="set2"/>
69 </repeat>
70 <param name="searchresult">
71 <collection type="list">
72 <element name="fr_one_set1_spectra" value="empty_file1.mzid"/>
73 <element name="fr_two_set1_spectra" value="empty_file2.mzid"/>
74 <element name="fr_three_set1_spectra" value="empty_file3.mzid"/>
75 <element name="fr_one_set2_spectra" value="empty_file4.mzid"/>
76 <element name="fr_two_set2_spectra" value="empty_file5.mzid"/>
77 <element name="fr_three_set2_spectra" value="empty_file6.mzid"/>
78 </collection>
79 </param>
80 <output_collection name="metafile_collection" type="list">
81 <element name="percolatorpool0">
82 <assert_contents>
83 <has_text_matching expression="dataset_7.dat" />
84 <has_text_matching expression="dataset_8.dat" />
85 </assert_contents>
86 </element>
87 <element name="percolatorpool1">
88 <assert_contents>
89 <has_text_matching expression="dataset_9.dat" />
90 </assert_contents>
91 </element>
92 <element name="percolatorpool2">
93 <assert_contents>
94 <has_text_matching expression="dataset_10.dat" />
95 <has_text_matching expression="dataset_11.dat" />
96 </assert_contents>
97 </element>
98 <element name="percolatorpool3">
99 <assert_contents>
100 <has_text_matching expression="dataset_12.dat" />
101 </assert_contents>
102 </element>
103 </output_collection>
104 </test>
105 </tests>
106 <help>
107 Creates meta files containing the filenames of the search data in batches of
108 a specific size. These are used as inputs to sqt2pin, msgfplus2pin or tandem2pin.
109 Use this feature when you want to batch a specific amount of input search results
110 to run in percolator, as opposed to one at a time. This tool generates a collection
111 containing multiple batches of the search results. You can specify batch size as well
112 as a pattern in the spectra files which makes sure the batching isn't continued through
113 very different MS sets. Instead, for each filename-pattern it generates batches of the
114 specified size.
115 </help>
116 </tool>