comparison workflows/summarize_counts_workflow.ga @ 0:e979cb57a5d5 draft default tip

"planemo upload for repository https://github.com/McIntyre-Lab/BayesASE/tree/main/galaxy commit 9b70598ef46a73632d9e0fa0c6ce6776fb5e9d6a"
author malex
date Thu, 14 Jan 2021 21:51:36 +0000
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:e979cb57a5d5
1 {
2 "a_galaxy_workflow": "true",
3 "annotation": "The Summarize Counts workflow\n prepares the input datasets for entry into the Bayesian model by flagging features that do not meet a user-\ndefined APN (Average Reads per Nucleotide) threshold, and thus have low read coverage. These features are not removed from the dataset, however they are excluded from further analysis in order to prevent the likelihood of low confidence in data. **NOTE: There are input parameters that are automatically collapsed/hidden by Galaxy\n that should be examined prior to running workflow\n**",
4 "format-version": "0.1",
5 "name": "Summarize Counts for BASE",
6 "steps": {
7 "0": {
8 "annotation": "**Must be sorted by biological replicate** More information on how the design file should be formatted can be checked by reading the BASE Galaxy User Guide, or looking at the Combine Counts Table tool help section. The **Check Alignment Design File tool** is also available to verify whether the input design file is of the proper format and does not contain any errors such as duplicate FASTQ file names ",
9 "content_id": null,
10 "errors": null,
11 "id": 0,
12 "input_connections": {},
13 "inputs": [
14 {
15 "description": "**Must be sorted by biological replicate** More information on how the design file should be formatted can be checked by reading the BASE Galaxy User Guide, or looking at the Combine Counts Table tool help section. The **Check Alignment Design File tool** is also available to verify whether the input design file is of the proper format and does not contain any errors such as duplicate FASTQ file names ",
16 "name": "Input Alignment Design File"
17 }
18 ],
19 "label": "Input Alignment Design File",
20 "name": "Input dataset",
21 "outputs": [],
22 "position": {
23 "left": 314.4000244140625,
24 "top": 183
25 },
26 "tool_id": null,
27 "tool_state": "{\"optional\": false}",
28 "tool_version": null,
29 "type": "data_input",
30 "uuid": "62aa4b85-8816-4517-b017-19b8b917b665",
31 "workflow_outputs": [
32 {
33 "label": null,
34 "output_name": "output",
35 "uuid": "bf4184fc-f95f-4354-b690-5e7c551e7ad1"
36 }
37 ]
38 },
39 "1": {
40 "annotation": "Collection of ASE Counts tables can be created by using the SAM Compare with Feature tool. The design file should contain only the FQ files that are within the collection of ASE Counts table ",
41 "content_id": null,
42 "errors": null,
43 "id": 1,
44 "input_connections": {},
45 "inputs": [
46 {
47 "description": "Collection of ASE Counts tables can be created by using the SAM Compare with Feature tool. The design file should contain only the FQ files that are within the collection of ASE Counts table ",
48 "name": "Input Collection of ASE Counts tables "
49 }
50 ],
51 "label": "Input Collection of ASE Counts tables ",
52 "name": "Input dataset collection",
53 "outputs": [],
54 "position": {
55 "left": 229.79998779296875,
56 "top": 344
57 },
58 "tool_id": null,
59 "tool_state": "{\"optional\": false, \"collection_type\": \"list\"}",
60 "tool_version": null,
61 "type": "data_collection_input",
62 "uuid": "c3cf1acb-03ec-4d1b-9eaa-60404488ae37",
63 "workflow_outputs": [
64 {
65 "label": null,
66 "output_name": "output",
67 "uuid": "f96caa64-e4d3-44f3-922c-ea47ccc1de58"
68 }
69 ]
70 },
71 "2": {
72 "annotation": "4-column BED file that contains the locations of the features of interest. Do not use the reformatted BED file that was output from the Align and Counts workflow **See the BASE User Guide for correct format**",
73 "content_id": null,
74 "errors": null,
75 "id": 2,
76 "input_connections": {},
77 "inputs": [
78 {
79 "description": "4-column BED file that contains the locations of the features of interest. Do not use the reformatted BED file that was output from the Align and Counts workflow **See the BASE User Guide for correct format**",
80 "name": "Input BED file"
81 }
82 ],
83 "label": "Input BED file",
84 "name": "Input dataset",
85 "outputs": [],
86 "position": {
87 "left": 304,
88 "top": 281.3999938964844
89 },
90 "tool_id": null,
91 "tool_state": "{\"optional\": false}",
92 "tool_version": null,
93 "type": "data_input",
94 "uuid": "120dcdb4-aa29-4b5f-a3bd-095b5a63c53c",
95 "workflow_outputs": [
96 {
97 "label": null,
98 "output_name": "output",
99 "uuid": "97af324a-4a2a-474b-8bc3-28b38b8986a2"
100 }
101 ]
102 },
103 "3": {
104 "annotation": "Indicate whether data contains real data or simulated reads. \n\n**Enter \"False\" for real data**\n**Enter \"True\" for simulated data**",
105 "content_id": null,
106 "errors": null,
107 "id": 3,
108 "input_connections": {},
109 "inputs": [
110 {
111 "description": "Indicate whether data contains real data or simulated reads. \n\n**Enter \"False\" for real data**\n**Enter \"True\" for simulated data**",
112 "name": "Indicate Dataset Type"
113 }
114 ],
115 "label": "Indicate Dataset Type",
116 "name": "Input parameter",
117 "outputs": [],
118 "position": {
119 "left": 334.79998779296875,
120 "top": 420.6000061035156
121 },
122 "tool_id": null,
123 "tool_state": "{\"default\": \"False\", \"parameter_type\": \"text\", \"optional\": true}",
124 "tool_version": null,
125 "type": "parameter_input",
126 "uuid": "c581508a-8805-4442-b58d-28a675d7ac35",
127 "workflow_outputs": [
128 {
129 "label": null,
130 "output_name": "output",
131 "uuid": "4c94c2dd-3d09-4fe3-9d00-86a0994fc794"
132 }
133 ]
134 },
135 "4": {
136 "annotation": "Enter where the biological replicates of interest start in the design file. Use if only doing analysis on a certain subset within the input design file ",
137 "content_id": null,
138 "errors": null,
139 "id": 4,
140 "input_connections": {},
141 "inputs": [
142 {
143 "description": "Enter where the biological replicates of interest start in the design file. Use if only doing analysis on a certain subset within the input design file ",
144 "name": "Start point in Design File [OPTIONAL]"
145 }
146 ],
147 "label": "Start point in Design File [OPTIONAL]",
148 "name": "Input parameter",
149 "outputs": [],
150 "position": {
151 "left": 286,
152 "top": 499.4000244140625
153 },
154 "tool_id": null,
155 "tool_state": "{\"parameter_type\": \"text\", \"optional\": true}",
156 "tool_version": null,
157 "type": "parameter_input",
158 "uuid": "fb6ce2d1-a81a-4db1-87e5-36cce2a0eca1",
159 "workflow_outputs": [
160 {
161 "label": null,
162 "output_name": "output",
163 "uuid": "2cf2a952-da1b-4304-8e10-38247cf6d197"
164 }
165 ]
166 },
167 "5": {
168 "annotation": "Enter the point in design file where user wants to exclude further FASTQ files from data analysis. Use only if analyzing a subset of FASTQ files within the design file\n",
169 "content_id": null,
170 "errors": null,
171 "id": 5,
172 "input_connections": {},
173 "inputs": [
174 {
175 "description": "Enter the point in design file where user wants to exclude further FASTQ files from data analysis. Use only if analyzing a subset of FASTQ files within the design file\n",
176 "name": "End point in Design File [OPTIONAL]"
177 }
178 ],
179 "label": "End point in Design File [OPTIONAL]",
180 "name": "Input parameter",
181 "outputs": [],
182 "position": {
183 "left": 433.20001220703125,
184 "top": 553
185 },
186 "tool_id": null,
187 "tool_state": "{\"parameter_type\": \"text\", \"optional\": false}",
188 "tool_version": null,
189 "type": "parameter_input",
190 "uuid": "fe9b28fc-b604-4d93-96ac-1d1e97d42242",
191 "workflow_outputs": [
192 {
193 "label": null,
194 "output_name": "output",
195 "uuid": "7b08491a-8dac-41bc-80dd-c02244a938fa"
196 }
197 ]
198 },
199 "6": {
200 "annotation": "Indicate the APN threshold. Features that are above this threshold are deemed expressed and have high enough read coverage, and thus are eligible for continued analysis in the Bayesian Model **Default setting is 5**",
201 "content_id": null,
202 "errors": null,
203 "id": 6,
204 "input_connections": {},
205 "inputs": [
206 {
207 "description": "Indicate the APN threshold. Features that are above this threshold are deemed expressed and have high enough read coverage, and thus are eligible for continued analysis in the Bayesian Model **Default setting is 5**",
208 "name": "APN threshold"
209 }
210 ],
211 "label": "APN threshold",
212 "name": "Input parameter",
213 "outputs": [],
214 "position": {
215 "left": 746,
216 "top": 519.7999877929688
217 },
218 "tool_id": null,
219 "tool_state": "{\"default\": \"5\", \"parameter_type\": \"text\", \"optional\": true}",
220 "tool_version": null,
221 "type": "parameter_input",
222 "uuid": "cf91592b-c1e4-4f95-95b7-a2c7f38bca29",
223 "workflow_outputs": [
224 {
225 "label": null,
226 "output_name": "output",
227 "uuid": "114545cb-06b4-4134-8927-6a4645133b06"
228 }
229 ]
230 },
231 "7": {
232 "annotation": "Enter the header name of the column that specified the name of the first parental genome. **Default value is G1**",
233 "content_id": null,
234 "errors": null,
235 "id": 7,
236 "input_connections": {},
237 "inputs": [
238 {
239 "description": "Enter the header name of the column that specified the name of the first parental genome. **Default value is G1**",
240 "name": "Name of G1 column in Design File"
241 }
242 ],
243 "label": "Name of G1 column in Design File",
244 "name": "Input parameter",
245 "outputs": [],
246 "position": {
247 "left": 714,
248 "top": 589
249 },
250 "tool_id": null,
251 "tool_state": "{\"default\": \"G1\", \"parameter_type\": \"text\", \"optional\": true}",
252 "tool_version": null,
253 "type": "parameter_input",
254 "uuid": "aee7e8ad-c871-47d4-9e19-47f59f565e31",
255 "workflow_outputs": [
256 {
257 "label": null,
258 "output_name": "output",
259 "uuid": "29e1654b-7b7e-495d-96ce-a397bc81323d"
260 }
261 ]
262 },
263 "8": {
264 "annotation": "Enter the header name for the column that specifies the name of the second parental genome **Default value is G2**",
265 "content_id": null,
266 "errors": null,
267 "id": 8,
268 "input_connections": {},
269 "inputs": [
270 {
271 "description": "Enter the header name for the column that specifies the name of the second parental genome **Default value is G2**",
272 "name": "Name of G2 column in Design File"
273 }
274 ],
275 "label": "Name of G2 column in Design File",
276 "name": "Input parameter",
277 "outputs": [],
278 "position": {
279 "left": 798.5999755859375,
280 "top": 702
281 },
282 "tool_id": null,
283 "tool_state": "{\"default\": \"G2\", \"parameter_type\": \"text\", \"optional\": true}",
284 "tool_version": null,
285 "type": "parameter_input",
286 "uuid": "ee3b186b-d883-4493-a033-33d0e8612a04",
287 "workflow_outputs": [
288 {
289 "label": null,
290 "output_name": "output",
291 "uuid": "003f33a7-fef5-482a-9932-63046b8b5354"
292 }
293 ]
294 },
295 "9": {
296 "annotation": "Enter the header name of the column that contains the comparate condition + biological replicate number **Default value is sampleID**",
297 "content_id": null,
298 "errors": null,
299 "id": 9,
300 "input_connections": {},
301 "inputs": [
302 {
303 "description": "Enter the header name of the column that contains the comparate condition + biological replicate number **Default value is sampleID**",
304 "name": "Name of sample ID column in Design File"
305 }
306 ],
307 "label": "Name of sample ID column in Design File",
308 "name": "Input parameter",
309 "outputs": [],
310 "position": {
311 "left": 800,
312 "top": 794.5999755859375
313 },
314 "tool_id": null,
315 "tool_state": "{\"default\": \"sampleID\", \"parameter_type\": \"text\", \"optional\": true}",
316 "tool_version": null,
317 "type": "parameter_input",
318 "uuid": "aa89d9fa-afc8-4261-934b-ac3076fa41b4",
319 "workflow_outputs": [
320 {
321 "label": null,
322 "output_name": "output",
323 "uuid": "a5f3216e-e886-4dfc-9513-6910714b4f9c"
324 }
325 ]
326 },
327 "10": {
328 "annotation": "Enter the header name of the column that contains only the comparate condition (NO biological replicate number) **Default value is comparate** ",
329 "content_id": null,
330 "errors": null,
331 "id": 10,
332 "input_connections": {},
333 "inputs": [
334 {
335 "description": "Enter the header name of the column that contains only the comparate condition (NO biological replicate number) **Default value is comparate** ",
336 "name": "Name of comparate column in Design File"
337 }
338 ],
339 "label": "Name of comparate column in Design File",
340 "name": "Input parameter",
341 "outputs": [],
342 "position": {
343 "left": 817.199951171875,
344 "top": 897.7999877929688
345 },
346 "tool_id": null,
347 "tool_state": "{\"default\": \"comparate\", \"parameter_type\": \"text\", \"optional\": true}",
348 "tool_version": null,
349 "type": "parameter_input",
350 "uuid": "502a2c0a-e3c3-408c-aa1e-5a118ebead2d",
351 "workflow_outputs": [
352 {
353 "label": null,
354 "output_name": "output",
355 "uuid": "d171b2eb-fe5a-45a9-a825-703648dd9cc6"
356 }
357 ]
358 },
359 "11": {
360 "annotation": "Sums a collection of ASE Counts Tables derived from FASTQ files (technical replicates) that are progeny of the same biological replicate(s). This tool also calculates APN (Average reads per Nucleotide) values for each feature ",
361 "content_id": "combine_cnt_tables",
362 "errors": null,
363 "id": 11,
364 "input_connections": {
365 "bed": {
366 "id": 2,
367 "output_name": "output"
368 },
369 "begin": {
370 "id": 4,
371 "output_name": "output"
372 },
373 "collection": {
374 "id": 1,
375 "output_name": "output"
376 },
377 "design": {
378 "id": 0,
379 "output_name": "output"
380 },
381 "end": {
382 "id": 5,
383 "output_name": "output"
384 },
385 "sim": {
386 "id": 3,
387 "output_name": "output"
388 }
389 },
390 "inputs": [],
391 "label": "Combine Counts Tables ",
392 "name": "Combine ASE Count Tables:",
393 "outputs": [
394 {
395 "name": "split_output",
396 "type": "input"
397 },
398 {
399 "name": "output_designFile",
400 "type": "tabular"
401 }
402 ],
403 "position": {
404 "left": 719.7999877929688,
405 "top": 151.60000610351562
406 },
407 "post_job_actions": {},
408 "tool_id": "combine_cnt_tables",
409 "tool_state": "{\"bed\": {\"__class__\": \"ConnectedValue\"}, \"begin\": {\"__class__\": \"ConnectedValue\"}, \"collection\": {\"__class__\": \"ConnectedValue\"}, \"design\": {\"__class__\": \"ConnectedValue\"}, \"end\": {\"__class__\": \"ConnectedValue\"}, \"sim\": {\"__class__\": \"ConnectedValue\"}, \"__page__\": null, \"__rerun_remap_job_id__\": null}",
410 "tool_version": "0.1.0",
411 "type": "tool",
412 "uuid": "2b425b9f-f4d6-446d-8474-0c9e03ccd776",
413 "workflow_outputs": [
414 {
415 "label": null,
416 "output_name": "split_output",
417 "uuid": "3094413c-717a-4817-9842-49f0555a4b6c"
418 },
419 {
420 "label": null,
421 "output_name": "output_designFile",
422 "uuid": "39095c0c-c674-4989-8838-09a9b8ad8d19"
423 }
424 ]
425 },
426 "12": {
427 "annotation": "Filters features in the summed ASE Counts tables and flags those that are below the user-defined APN threshold, preventing them from being analyzed in the Bayesian Model due to low read coverage. Flagged features (indicated by a 0 in the flag_analyze column) are not removed from the dataset, however. ",
428 "content_id": "summarize_sam_compare_cnts_table_1cond",
429 "errors": null,
430 "id": 12,
431 "input_connections": {
432 "apn": {
433 "id": 6,
434 "output_name": "output"
435 },
436 "collection": {
437 "id": 11,
438 "output_name": "split_output"
439 },
440 "design": {
441 "id": 11,
442 "output_name": "output_designFile"
443 },
444 "parent1": {
445 "id": 7,
446 "output_name": "output"
447 },
448 "parent2": {
449 "id": 8,
450 "output_name": "output"
451 },
452 "sampleCol": {
453 "id": 10,
454 "output_name": "output"
455 },
456 "sampleIDCol": {
457 "id": 9,
458 "output_name": "output"
459 }
460 },
461 "inputs": [],
462 "label": "Summarize and Filter ASE Counts Tables",
463 "name": "Summarize and Filter ASE Count Tables",
464 "outputs": [
465 {
466 "name": "split_output",
467 "type": "input"
468 }
469 ],
470 "position": {
471 "left": 1114,
472 "top": 306.20001220703125
473 },
474 "post_job_actions": {},
475 "tool_id": "summarize_sam_compare_cnts_table_1cond",
476 "tool_state": "{\"apn\": {\"__class__\": \"ConnectedValue\"}, \"collection\": {\"__class__\": \"ConnectedValue\"}, \"design\": {\"__class__\": \"ConnectedValue\"}, \"parent1\": {\"__class__\": \"ConnectedValue\"}, \"parent2\": {\"__class__\": \"ConnectedValue\"}, \"sampleCol\": {\"__class__\": \"ConnectedValue\"}, \"sampleIDCol\": {\"__class__\": \"ConnectedValue\"}, \"__page__\": null, \"__rerun_remap_job_id__\": null}",
477 "tool_version": "0.1.0",
478 "type": "tool",
479 "uuid": "70bae872-18fe-4c5b-a743-f332316905fb",
480 "workflow_outputs": [
481 {
482 "label": null,
483 "output_name": "split_output",
484 "uuid": "c788ab68-7de3-434c-aec1-6759635bce78"
485 }
486 ]
487 },
488 "13": {
489 "annotation": "This tool reformats the Sample design file created by the Combine Counts Tables tool by removing the sampleID column, creating the Priors Design File. This design file is used as input into the Calculate Priors module.",
490 "content_id": "base_reformat_design_file",
491 "errors": null,
492 "id": 13,
493 "input_connections": {
494 "DESIGN": {
495 "id": 11,
496 "output_name": "output_designFile"
497 }
498 },
499 "inputs": [],
500 "label": "Reformat Sample Design File",
501 "name": "Reformat Sample Design File",
502 "outputs": [
503 {
504 "name": "OUTFILE",
505 "type": "tsv"
506 }
507 ],
508 "position": {
509 "left": 1242,
510 "top": 832.7999877929688
511 },
512 "post_job_actions": {},
513 "tool_id": "base_reformat_design_file",
514 "tool_state": "{\"DESIGN\": {\"__class__\": \"ConnectedValue\"}, \"__page__\": null, \"__rerun_remap_job_id__\": null}",
515 "tool_version": "0.1.0",
516 "type": "tool",
517 "uuid": "804887ca-df1f-4c8c-87fa-fab3bdcef5e3",
518 "workflow_outputs": [
519 {
520 "label": null,
521 "output_name": "OUTFILE",
522 "uuid": "2548d392-ad0a-441d-bd7b-96f040bff88e"
523 }
524 ]
525 }
526 },
527 "tags": [],
528 "uuid": "b5e1664e-69e1-4447-bc79-986ec117b3fb",
529 "version": 20
530 }