<?xml version="1.0" encoding="UTF-8"?>
<!--
  Galaxy wrapper for the SAINT pre-processing step.
  Depending on the selected data source it runs one of the bundled Python
  scripts and declares three text outputs: Inter_file, Prey_file and Bait_file.
-->
<tool id="SAINT_preprocessing_v6" name="SAINT pre-processing">
    <description></description>
    <!--
      The command is a Cheetah template with one branch per "Data Source" option.
      Every branch passes one double-quoted argument assembled from the
      "Bait Create" repeat (bait name, group assignment and control flag for
      each entry). The backslash in \$INSTALL_RUN_PATH keeps Cheetah from
      substituting it, so the shell expands the variable at run time.
    -->
    <command interpreter="python">
        ## Scaffold: the optional user bait file is the last (10th) argument.
        #if (str($type_select.type) == 'Scaffold'):
            SAINT_preprocessing.py $type_select.input $type_select.preybool $type_select.fasta_db $Inter_file $Prey_file
            "
            #for $ba in $bait
                ${ba.bait1}
                ${ba.assign}
                ${ba.T_C}
            #end for
            "
            $Bait_file \$INSTALL_RUN_PATH/ $type_select.bait_bool $type_select.bait_file_in
        ## MaxQuant: same argument layout as Scaffold, different script.
        #elif (str($type_select.type) == 'MaxQuant'):
            SAINT_preprocessing_mq_pep.py $type_select.input $type_select.preybool $type_select.fasta_db $Inter_file $Prey_file
            "
            #for $ba in $bait
                ${ba.bait1}
                ${ba.assign}
                ${ba.T_C}
            #end for
            "
            $Bait_file \$INSTALL_RUN_PATH/ $type_select.bait_bool $type_select.bait_file_in
        ## Peptideshaker: the input is a multi-select data parameter passed as one quoted argument.
        #elif (str($type_select.type) == 'Peptideshaker'):
            Protein_report_processing.py "$type_select.input" $Bait_file $type_select.use_metric $type_select.fasta_db $type_select.preybool
            "
            #for $ba in $bait
                ${ba.bait1}
                ${ba.assign}
                ${ba.T_C}
            #end for
            "
            \$INSTALL_RUN_PATH/ $type_select.bait_bool $type_select.bait_file_in $Inter_file $Prey_file
        ## Peptideshaker (ordered): repeat entries are joined with commas in the order the user added them.
        #elif (str($type_select.type) == 'Peptideshaker_ordered_input'):
            Protein_report_processing.py
            #set $protein_files=[]
            #for $i1, $protein_input in enumerate($type_select.protein_inputs)
                #silent $protein_files.append(str($protein_input.protein_file))
            #end for
            #echo ','.join($protein_files)
            $Bait_file $type_select.use_metric $type_select.fasta_db $type_select.preybool
            "
            #for $ba in $bait
                ${ba.bait1}
                ${ba.assign}
                ${ba.T_C}
            #end for
            "
            \$INSTALL_RUN_PATH/ $type_select.bait_bool $type_select.bait_file_in $Inter_file $Prey_file
        ## mzIdentML: note the different argument order (bait file second, outputs last).
        #elif (str($type_select.type) == 'mzIdentML'):
            mzID_process2.py "$type_select.input" $type_select.bait_file_in $type_select.preybool $type_select.fasta_db \$INSTALL_RUN_PATH/
            "
            #for $ba in $bait
                ${ba.bait1}
                ${ba.assign}
                ${ba.T_C}
            #end for
            "
            $type_select.bait_bool $Prey_file $Bait_file $Inter_file
        #end if
    </command>
    <!-- INSTALL_RUN_PATH is referenced by every branch of the command above. -->
    <requirements>
        <requirement type="set_environment">INSTALL_RUN_PATH</requirement>
    </requirements>
    <inputs>
        <!-- The selected data source decides which parameter set is shown and which script runs. -->
        <conditional name="type_select">
            <param type="select" name="type" label="Data Source">
                <option value="MaxQuant">MaxQuant</option>
                <option value="Scaffold">Scaffold</option>
                <option value="Peptideshaker">Peptideshaker</option>
                <option value="Peptideshaker_ordered_input">Peptideshaker Ordered Input</option>
                <option value="mzIdentML">mzIdentML</option>
            </param>
            <when value="MaxQuant">
                <param format="dat" name="input" type="data" label="MaxQuant peptides Output"/>
                <param type="boolean" name="preybool" checked="true" label="Create Prey File"/>
                <param type="data" name="fasta_db" format="fasta" label="Provide Uniprot Fasta database" optional="true"/>
                <param name="bait_bool" type="boolean" checked="true" label="Are You Providing Your Own bait file?"/>
                <param type="data" format="dat" name="bait_file_in" label="Bait File" optional="true"/>
            </when>
            <when value="Scaffold">
                <param format="dat" name="input" type="data" label="Scaffold Output"/>
                <param type="boolean" name="preybool" checked="true" label="Create Prey File"/>
                <param type="data" name="fasta_db" format="fasta" label="Provide Uniprot Fasta database" optional="true"/>
                <param name="bait_bool" type="boolean" checked="true" label="Are You Providing Your Own bait file?"/>
                <param type="data" format="dat" name="bait_file_in" label="Bait File" optional="true"/>
            </when>
            <when value="Peptideshaker">
                <param format="dat" name="input" type="data" label="Peptideshaker Output" multiple="true"/>
                <param type="select" name="use_metric" label="Select Report File Value for Quantification">
                    <option value="Validated_Peptides">#Validated Peptides</option>
                    <option value="Peptides">#Peptides</option>
                    <option value="Unique">#Unique</option>
                    <option value="Validated_PSMs">#Validated PSMs</option>
                    <option value="PSMs">#PSMs</option>
                </param>
                <param type="boolean" name="preybool" checked="true" label="Create Prey File"/>
                <param type="data" name="fasta_db" format="fasta" label="Provide Uniprot Fasta database" optional="true"/>
                <param name="bait_bool" type="boolean" checked="true" label="Are You Providing Your Own bait file?"/>
                <param type="data" format="dat" name="bait_file_in" label="Bait File" optional="true"/>
            </when>
            <when value="Peptideshaker_ordered_input">
                <!-- One repeat entry per report file; the command joins them in the order entered. -->
                <repeat name="protein_inputs" min="1" title="Input PeptideShaker Protein Result File">
                    <param format="tabular" name="protein_file" type="data" label="Peptideshaker Output" multiple="false"/>
                </repeat>
                <param type="select" name="use_metric" label="Select Report File Value for Quantification">
                    <option value="Validated_Peptides">#Validated Peptides</option>
                    <option value="Peptides">#Peptides</option>
                    <option value="Unique">#Unique</option>
                    <option value="Validated_PSMs">#Validated PSMs</option>
                    <option value="PSMs">#PSMs</option>
                </param>
                <param type="boolean" name="preybool" checked="true" label="Create Prey File"/>
                <param type="data" name="fasta_db" format="fasta" label="Provide Uniprot Fasta database" optional="true"/>
                <param name="bait_bool" type="boolean" checked="true" label="Are You Providing Your Own bait file?"/>
                <param type="data" format="dat" name="bait_file_in" label="Bait File" optional="true"/>
            </when>
            <when value="mzIdentML">
                <param format="dat" name="input" type="data" label="mzIdentML Files" multiple="true"/>
                <param type="boolean" name="preybool" checked="true" label="Create Prey File"/>
                <param type="data" name="fasta_db" format="fasta" label="Provide Uniprot Fasta database" optional="true"/>
                <param name="bait_bool" type="boolean" checked="true" label="Are You Providing Your Own bait file?"/>
                <param type="data" format="dat" name="bait_file_in" label="Bait File" optional="true"/>
            </when>
        </conditional>
        <!-- Entries of this repeat are flattened into the quoted bait argument of the command. -->
        <repeat name="bait" title="Bait Create">
            <param name="bait1" type="text" size="100" label="Bait"/>
            <param name="assign" type="text" size="100" label="Group Assignment"/>
            <param name="T_C" type="boolean" checked="true" label="Is this a Control?"/>
        </repeat>
    </inputs>
    <outputs>
        <data format="txt" name="Inter_file" label="Inter File"/>
        <data format="txt" name="Prey_file" label="Prey File"/>
        <data format="txt" name="Bait_file" label="Bait File"/>
    </outputs>
    <!--
      The "match" attributes are regular expressions. The two traceback patterns
      below are meant to match literal text, so brackets, parentheses and dots
      are backslash-escaped; unescaped they are parsed as character classes,
      groups and wildcards and never match the real message.
    -->
    <stdio>
        <regex match="Error: bad bait"
               source="stdout"
               level="fatal"
               description="Error: bad bait"/>
        <regex match="IOError: \[Errno 2\] No such file or directory: '\./tukeys_output\.txt'"
               source="stderr"
               level="fatal"
               description="Error: Scaffold/MaxQuant mismatch. Check job settings."/>
        <regex match="bait_temp_file = open\(sys\.argv\[10\], 'r'\)"
               source="stderr"
               level="fatal"
               description="Error: Bait create settings mismatch. Check job settings."/>
        <!-- Catch-all patterns for any other output containing "Error" or "error". -->
        <regex match="Error|error"
               source="stdout"
               level="fatal"
               description="Unknown error"/>
        <regex match="Error|error"
               source="stderr"
               level="fatal"
               description="Unknown error"/>
    </stdio>

    <!--
      NOTE(review): this test looks like a leftover from another tool. The
      output name "out_file1" is not declared in the outputs section above
      (Inter_file, Prey_file, Bait_file) and the fixture names refer to FASTA
      GC content. Replace it with real fixtures before relying on it.
    -->
    <tests>
        <test>
            <param name="input" value="fa_gc_content_input.fa"/>
            <output name="out_file1" file="fa_gc_content_output.txt"/>
        </test>
    </tests>
    <help>
Pre-Processing
^^^^^^^^^^^^^^

This tool will read in a Scaffold *Samples Report* file (tab-delimited
txt file), multiple Peptideshaker *Protein Report* files or a MaxQuant
*peptides.txt* file and process them to generate a *Bait File, Prey
File,* and *Inter File* for SAINTexpress analysis.

--------------

**1) MaxQuant or Scaffold**

APOSTL is able to recognize either a Scaffold *Samples Report* file
(tab-delimited txt file) or the *peptides.txt* file output in the
MaxQuant *txt* output folder. No modifications should be made to these
files. Please designate which one is being provided.

**2) Scaffold or MaxQuant File Input**

Select the corresponding *Samples Report* or *peptides.txt* here.

**3) Create Prey File**

Select whether or not you would like APOSTL to generate a prey file.

When making a prey file, APOSTL queries a user provided FASTA database
(see below) in order to extract protein amino acid lengths and gene
names. This may take several minutes depending on your computer and if
your Galaxy distribution is cluster enabled. Some users may want to run
SAINTexpress using the same data set while changing which baits are
considered test or control. It is useful to toggle **Create Prey File**
off in order to save time by circumventing this step as the same prey
file can be used for both SAINTexpress runs.

**4) Provide Uniprot FASTA database**

Please specify a FASTA file containing the protein sequence. You can
download the latest release of Uniprot's reviewed sequences (Swiss-Prot)
from http://www.uniprot.org/downloads. For computing efficiency,
please limit your FASTA file to your species of interest. It is
generally advised to use the same FASTA database that was used for your
database searches during peptide and protein ID.

**5) Are You Providing Your Own Bait File?**

Users have two options for providing a *Bait* file. If you would like to
create your own *Bait* file, select Yes and designate the file below. If
you would like to use the **Bait Create** tool to create a *Bait* file
within Galaxy, please select No and proceed to the **Bait Create** tool.

**6) Bait File**

If you selected Yes above, please specify the *Bait* file you would like
to provide. If you selected No above, ignore this argument and proceed
to the **Bait Create** tool.

**Note:** Individual bait names must match the sample names
within your Scaffold or MaxQuant output exactly and must contain no
whitespace characters (e.g. spaces) or dashes.

**Note:** When using Peptideshaker output the baits in the baitfile
need to be in the same order as the files selected.

**7) Bait Create**

Using the **Bait Create** tool, you can create your *bait.txt* file.

**Note:** Individual bait names must match the sample names
within your Scaffold or MaxQuant output exactly and must contain no
whitespace characters (e.g. spaces) or dashes.

APOSTL uses this bait file to find the user's baits of interest within a
*Samples Report* or *peptides.txt* file and when preparing the
*inter.txt* file.

--------------

Once your parameters have been finalized, please press the Execute
button to start processing. This may take a few minutes. Once your
process has been completed, you will see your *Bait File, Prey File,*
and *Inter File* on the right-hand side of your panel highlighted in
green.
    </help>
</tool>