Mercurial > repos > galaxyp > percolator
comparison metafiles2pin.xml @ 0:3a49065a05d6 draft
planemo upload for repository https://github.com/galaxyproteomics/tools-galaxyp/tools/percolator commit b4871f9659a924a68430aed3a93f4f9bad733fd6
author | galaxyp |
---|---|
date | Wed, 07 Dec 2016 16:43:51 -0500 |
parents | |
children |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:3a49065a05d6 |
---|---|
1 <tool id="metafiles2pin" name="Merge search data" version="1.0"> | |
2 <description>before creating percolator input</description> | |
3 <stdio> | |
4 <exit_code range="1:" /> | |
5 </stdio> | |
6 <command>python $__tool_directory__/metafiles2pin.py | |
7 --batchsize $percopoolsize | |
8 #if len($percopoolids) > 0 | |
9 --percolator-pool-ids | |
10 #for $ppool in $percopoolids | |
11 "${ppool.ppool_identifier}" | |
12 #end for | |
13 #end if | |
14 --spectrafiles | |
15 #for $specfile in $searchresult.keys() | |
16 "$specfile" | |
17 #end for | |
18 --searchfiles | |
19 #for $specfile in $searchresult.keys() | |
20 "$searchresult[$specfile]" | |
21 #end for | |
22 </command> | |
23 <inputs> | |
24 <param name="percopoolsize" type="integer" value="8" label="Amount of fractions to batch per Percolator process" /> | |
25 <repeat name="percopoolids" title="Percolator pools" help="For cases where file amounts cause search results to not automatically line up into correct percolator batches"> | |
26 <param name="ppool_identifier" type="text" label="Filename part identifying percolator pool" | |
27 help="Specify part of the input spectra filenames that are unique for each percolator pool, e.g set_A."/> | |
28 </repeat> | |
29 <param name="searchresult" type="data_collection" format="mzid" label="MSGF+, SQT or XTandem search results" /> | |
30 </inputs> | |
31 <outputs> | |
32 <collection name="metafile_collection" type="list" label="Percolator metafiles list"> | |
33 <discover_datasets pattern="__designation_and_ext__" directory="metafiles" /> | |
34 </collection> | |
35 </outputs> | |
36 <tests> | |
37 <test> | |
38 <param name="percopoolsize" value="2"/> | |
39 <param name="searchresult"> | |
40 <collection type="list"> | |
41 <element name="fraction_one_spectra" value="empty_file1.mzid"/> | |
42 <element name="fraction_two_spectra" value="empty_file2.mzid"/> | |
43 <element name="fraction_three_spectra" value="empty_file3.mzid"/> | |
44 <element name="fraction_four_spectra" value="empty_file4.mzid"/> | |
45 </collection> | |
46 </param> | |
47 <output_collection name="metafile_collection" type="list"> | |
48 <element name="percolatorpool0"> | |
49 <assert_contents> | |
50 <has_text_matching expression="dataset_1.dat" /> | |
51 <has_text_matching expression="dataset_2.dat" /> | |
52 </assert_contents> | |
53 </element> | |
54 <element name="percolatorpool1"> | |
55 <assert_contents> | |
56 <has_text_matching expression="dataset_3.dat" /> | |
57 <has_text_matching expression="dataset_4.dat" /> | |
58 </assert_contents> | |
59 </element> | |
60 </output_collection> | |
61 </test> | |
62 <test> | |
63 <param name="percopoolsize" value="2"/> | |
64 <repeat name="percopoolids"> | |
65 <param name="ppool_identifier" value="set1"/> | |
66 </repeat> | |
67 <repeat name="percopoolids"> | |
68 <param name="ppool_identifier" value="set2"/> | |
69 </repeat> | |
70 <param name="searchresult"> | |
71 <collection type="list"> | |
72 <element name="fr_one_set1_spectra" value="empty_file1.mzid"/> | |
73 <element name="fr_two_set1_spectra" value="empty_file2.mzid"/> | |
74 <element name="fr_three_set1_spectra" value="empty_file3.mzid"/> | |
75 <element name="fr_one_set2_spectra" value="empty_file4.mzid"/> | |
76 <element name="fr_two_set2_spectra" value="empty_file5.mzid"/> | |
77 <element name="fr_three_set2_spectra" value="empty_file6.mzid"/> | |
78 </collection> | |
79 </param> | |
80 <output_collection name="metafile_collection" type="list"> | |
81 <element name="percolatorpool0"> | |
82 <assert_contents> | |
83 <has_text_matching expression="dataset_7.dat" /> | |
84 <has_text_matching expression="dataset_8.dat" /> | |
85 </assert_contents> | |
86 </element> | |
87 <element name="percolatorpool1"> | |
88 <assert_contents> | |
89 <has_text_matching expression="dataset_9.dat" /> | |
90 </assert_contents> | |
91 </element> | |
92 <element name="percolatorpool2"> | |
93 <assert_contents> | |
94 <has_text_matching expression="dataset_10.dat" /> | |
95 <has_text_matching expression="dataset_11.dat" /> | |
96 </assert_contents> | |
97 </element> | |
98 <element name="percolatorpool3"> | |
99 <assert_contents> | |
100 <has_text_matching expression="dataset_12.dat" /> | |
101 </assert_contents> | |
102 </element> | |
103 </output_collection> | |
104 </test> | |
105 </tests> | |
106 <help> | |
107 Creates meta files containing the filenames of the search data in batches of | |
108 a specific size. These are used as inputs to sqt2pin, msgfplus2pin or tandem2pin. | |
109 Use this feature when you want to batch a specific amount of input search results | |
110 to run in percolator, as opposed to one at a time. This tool generates a collection | |
111 containing multiple batches of the search results. You can specify batch size as well | |
112 as a pattern in the spectra files which makes sure the batching isn't continued through | |
113 very different MS sets. Instead, for each filename-pattern it generates batches of the | |
114 specified size. | |
115 </help> | |
116 </tool> |